src/hotspot/cpu/x86/x86.ad
author mdoerr
Wed, 16 Oct 2019 11:52:56 +0200
changeset 58643 b381e5328461
parent 58516 d376d86b0a01
child 58679 9c3209ff7550
permissions -rw-r--r--
8232106: [x86] C2: SIGILL due to usage of SSSE3 instructions on processors which don't support it Reviewed-by: kvn, thartmann
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     1
//
54022
ff399127078a 8217561: X86: Add floating-point Math.min/max intrinsics
bsrbnd
parents: 53639
diff changeset
     2
// Copyright (c) 2011, 2019, Oracle and/or its affiliates. All rights reserved.
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     3
// DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     4
//
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     5
// This code is free software; you can redistribute it and/or modify it
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     6
// under the terms of the GNU General Public License version 2 only, as
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     7
// published by the Free Software Foundation.
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     8
//
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     9
// This code is distributed in the hope that it will be useful, but WITHOUT
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    10
// ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    11
// FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    12
// version 2 for more details (a copy is included in the LICENSE file that
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    13
// accompanied this code).
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    14
//
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    15
// You should have received a copy of the GNU General Public License version
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    16
// 2 along with this work; if not, write to the Free Software Foundation,
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    17
// Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    18
//
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    19
// Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    20
// or visit www.oracle.com if you need additional information or have any
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    21
// questions.
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    22
//
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    23
//
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    24
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    25
// X86 Common Architecture Description File
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    26
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    27
//----------REGISTER DEFINITION BLOCK------------------------------------------
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    28
// This information is used by the matcher and the register allocator to
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    29
// describe individual registers and classes of registers within the target
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    30
// archtecture.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    31
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    32
register %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    33
//----------Architecture Description Register Definitions----------------------
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    34
// General Registers
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    35
// "reg_def"  name ( register save type, C convention save type,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    36
//                   ideal register type, encoding );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    37
// Register Save Types:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    38
//
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    39
// NS  = No-Save:       The register allocator assumes that these registers
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    40
//                      can be used without saving upon entry to the method, &
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    41
//                      that they do not need to be saved at call sites.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    42
//
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    43
// SOC = Save-On-Call:  The register allocator assumes that these registers
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    44
//                      can be used without saving upon entry to the method,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    45
//                      but that they must be saved at call sites.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    46
//
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    47
// SOE = Save-On-Entry: The register allocator assumes that these registers
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    48
//                      must be saved before using them upon entry to the
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    49
//                      method, but they do not need to be saved at call
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    50
//                      sites.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    51
//
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    52
// AS  = Always-Save:   The register allocator assumes that these registers
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    53
//                      must be saved before using them upon entry to the
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    54
//                      method, & that they must be saved at call sites.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    55
//
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    56
// Ideal Register Type is used to determine how to save & restore a
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    57
// register.  Op_RegI will get spilled with LoadI/StoreI, Op_RegP will get
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    58
// spilled with LoadP/StoreP.  If the register supports both, use Op_RegI.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    59
//
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    60
// The encoding number is the actual bit-pattern placed into the opcodes.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    61
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    62
// XMM registers.  512-bit registers or 8 words each, labeled (a)-p.
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    63
// Word a in each register holds a Float, words ab hold a Double.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    64
// The whole registers are used in SSE4.2 version intrinsics,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    65
// array copy stubs and superword operations (see UseSSE42Intrinsics,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    66
// UseXMMForArrayCopy and UseSuperword flags).
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    67
// For pre EVEX enabled architectures:
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    68
//      XMM8-XMM15 must be encoded with REX (VEX for UseAVX)
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    69
// For EVEX enabled architectures:
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    70
//      XMM8-XMM31 must be encoded with REX (EVEX for UseAVX).
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    71
//
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    72
// Linux ABI:   No register preserved across function calls
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    73
//              XMM0-XMM7 might hold parameters
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    74
// Windows ABI: XMM6-XMM31 preserved across function calls
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    75
//              XMM0-XMM3 might hold parameters
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    76
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    77
reg_def XMM0 ( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    78
reg_def XMM0b( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    79
reg_def XMM0c( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    80
reg_def XMM0d( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    81
reg_def XMM0e( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    82
reg_def XMM0f( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    83
reg_def XMM0g( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    84
reg_def XMM0h( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    85
reg_def XMM0i( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    86
reg_def XMM0j( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    87
reg_def XMM0k( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    88
reg_def XMM0l( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    89
reg_def XMM0m( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    90
reg_def XMM0n( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    91
reg_def XMM0o( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    92
reg_def XMM0p( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    93
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    94
reg_def XMM1 ( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    95
reg_def XMM1b( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    96
reg_def XMM1c( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    97
reg_def XMM1d( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    98
reg_def XMM1e( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    99
reg_def XMM1f( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   100
reg_def XMM1g( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   101
reg_def XMM1h( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   102
reg_def XMM1i( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   103
reg_def XMM1j( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   104
reg_def XMM1k( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   105
reg_def XMM1l( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   106
reg_def XMM1m( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   107
reg_def XMM1n( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   108
reg_def XMM1o( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   109
reg_def XMM1p( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   110
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   111
reg_def XMM2 ( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   112
reg_def XMM2b( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   113
reg_def XMM2c( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   114
reg_def XMM2d( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   115
reg_def XMM2e( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   116
reg_def XMM2f( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   117
reg_def XMM2g( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   118
reg_def XMM2h( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   119
reg_def XMM2i( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   120
reg_def XMM2j( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   121
reg_def XMM2k( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   122
reg_def XMM2l( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   123
reg_def XMM2m( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   124
reg_def XMM2n( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   125
reg_def XMM2o( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   126
reg_def XMM2p( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   127
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   128
reg_def XMM3 ( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   129
reg_def XMM3b( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   130
reg_def XMM3c( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   131
reg_def XMM3d( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   132
reg_def XMM3e( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   133
reg_def XMM3f( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   134
reg_def XMM3g( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   135
reg_def XMM3h( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   136
reg_def XMM3i( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   137
reg_def XMM3j( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   138
reg_def XMM3k( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   139
reg_def XMM3l( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   140
reg_def XMM3m( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   141
reg_def XMM3n( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   142
reg_def XMM3o( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   143
reg_def XMM3p( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   144
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   145
reg_def XMM4 ( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   146
reg_def XMM4b( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   147
reg_def XMM4c( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   148
reg_def XMM4d( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   149
reg_def XMM4e( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   150
reg_def XMM4f( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   151
reg_def XMM4g( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   152
reg_def XMM4h( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   153
reg_def XMM4i( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   154
reg_def XMM4j( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   155
reg_def XMM4k( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   156
reg_def XMM4l( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   157
reg_def XMM4m( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   158
reg_def XMM4n( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   159
reg_def XMM4o( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   160
reg_def XMM4p( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   161
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   162
reg_def XMM5 ( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   163
reg_def XMM5b( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   164
reg_def XMM5c( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   165
reg_def XMM5d( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   166
reg_def XMM5e( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   167
reg_def XMM5f( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   168
reg_def XMM5g( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   169
reg_def XMM5h( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   170
reg_def XMM5i( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   171
reg_def XMM5j( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   172
reg_def XMM5k( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   173
reg_def XMM5l( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   174
reg_def XMM5m( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   175
reg_def XMM5n( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   176
reg_def XMM5o( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   177
reg_def XMM5p( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   178
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   179
reg_def XMM6 ( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   180
reg_def XMM6b( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   181
reg_def XMM6c( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   182
reg_def XMM6d( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   183
reg_def XMM6e( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   184
reg_def XMM6f( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   185
reg_def XMM6g( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   186
reg_def XMM6h( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   187
reg_def XMM6i( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   188
reg_def XMM6j( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   189
reg_def XMM6k( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   190
reg_def XMM6l( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   191
reg_def XMM6m( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   192
reg_def XMM6n( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   193
reg_def XMM6o( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   194
reg_def XMM6p( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   195
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   196
reg_def XMM7 ( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   197
reg_def XMM7b( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   198
reg_def XMM7c( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   199
reg_def XMM7d( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   200
reg_def XMM7e( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   201
reg_def XMM7f( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   202
reg_def XMM7g( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   203
reg_def XMM7h( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   204
reg_def XMM7i( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   205
reg_def XMM7j( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   206
reg_def XMM7k( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   207
reg_def XMM7l( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   208
reg_def XMM7m( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   209
reg_def XMM7n( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   210
reg_def XMM7o( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   211
reg_def XMM7p( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   212
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   213
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   214
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   215
reg_def XMM8 ( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   216
reg_def XMM8b( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   217
reg_def XMM8c( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   218
reg_def XMM8d( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   219
reg_def XMM8e( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   220
reg_def XMM8f( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   221
reg_def XMM8g( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   222
reg_def XMM8h( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   223
reg_def XMM8i( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   224
reg_def XMM8j( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   225
reg_def XMM8k( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   226
reg_def XMM8l( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   227
reg_def XMM8m( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   228
reg_def XMM8n( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   229
reg_def XMM8o( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   230
reg_def XMM8p( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   231
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   232
reg_def XMM9 ( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   233
reg_def XMM9b( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   234
reg_def XMM9c( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   235
reg_def XMM9d( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   236
reg_def XMM9e( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   237
reg_def XMM9f( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   238
reg_def XMM9g( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   239
reg_def XMM9h( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   240
reg_def XMM9i( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   241
reg_def XMM9j( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   242
reg_def XMM9k( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   243
reg_def XMM9l( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   244
reg_def XMM9m( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   245
reg_def XMM9n( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   246
reg_def XMM9o( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   247
reg_def XMM9p( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   248
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   249
reg_def XMM10 ( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   250
reg_def XMM10b( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   251
reg_def XMM10c( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   252
reg_def XMM10d( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   253
reg_def XMM10e( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   254
reg_def XMM10f( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   255
reg_def XMM10g( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   256
reg_def XMM10h( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   257
reg_def XMM10i( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   258
reg_def XMM10j( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   259
reg_def XMM10k( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   260
reg_def XMM10l( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   261
reg_def XMM10m( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   262
reg_def XMM10n( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   263
reg_def XMM10o( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   264
reg_def XMM10p( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   265
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   266
reg_def XMM11 ( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   267
reg_def XMM11b( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   268
reg_def XMM11c( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   269
reg_def XMM11d( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   270
reg_def XMM11e( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   271
reg_def XMM11f( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   272
reg_def XMM11g( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   273
reg_def XMM11h( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   274
reg_def XMM11i( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   275
reg_def XMM11j( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   276
reg_def XMM11k( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   277
reg_def XMM11l( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   278
reg_def XMM11m( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   279
reg_def XMM11n( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   280
reg_def XMM11o( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   281
reg_def XMM11p( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   282
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   283
reg_def XMM12 ( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   284
reg_def XMM12b( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   285
reg_def XMM12c( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   286
reg_def XMM12d( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   287
reg_def XMM12e( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   288
reg_def XMM12f( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   289
reg_def XMM12g( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   290
reg_def XMM12h( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   291
reg_def XMM12i( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   292
reg_def XMM12j( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   293
reg_def XMM12k( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   294
reg_def XMM12l( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   295
reg_def XMM12m( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   296
reg_def XMM12n( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   297
reg_def XMM12o( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   298
reg_def XMM12p( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   299
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   300
reg_def XMM13 ( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   301
reg_def XMM13b( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   302
reg_def XMM13c( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   303
reg_def XMM13d( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   304
reg_def XMM13e( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   305
reg_def XMM13f( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   306
reg_def XMM13g( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   307
reg_def XMM13h( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   308
reg_def XMM13i( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   309
reg_def XMM13j( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   310
reg_def XMM13k( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   311
reg_def XMM13l( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   312
reg_def XMM13m( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   313
reg_def XMM13n( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   314
reg_def XMM13o( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   315
reg_def XMM13p( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   316
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   317
reg_def XMM14 ( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   318
reg_def XMM14b( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   319
reg_def XMM14c( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   320
reg_def XMM14d( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   321
reg_def XMM14e( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   322
reg_def XMM14f( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   323
reg_def XMM14g( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   324
reg_def XMM14h( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   325
reg_def XMM14i( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   326
reg_def XMM14j( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   327
reg_def XMM14k( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   328
reg_def XMM14l( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   329
reg_def XMM14m( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   330
reg_def XMM14n( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   331
reg_def XMM14o( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   332
reg_def XMM14p( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   333
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   334
reg_def XMM15 ( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   335
reg_def XMM15b( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   336
reg_def XMM15c( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   337
reg_def XMM15d( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   338
reg_def XMM15e( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   339
reg_def XMM15f( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   340
reg_def XMM15g( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   341
reg_def XMM15h( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   342
reg_def XMM15i( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   343
reg_def XMM15j( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   344
reg_def XMM15k( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   345
reg_def XMM15l( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   346
reg_def XMM15m( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   347
reg_def XMM15n( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   348
reg_def XMM15o( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   349
reg_def XMM15p( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   350
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   351
reg_def XMM16 ( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   352
reg_def XMM16b( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   353
reg_def XMM16c( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   354
reg_def XMM16d( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   355
reg_def XMM16e( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   356
reg_def XMM16f( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   357
reg_def XMM16g( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   358
reg_def XMM16h( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   359
reg_def XMM16i( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   360
reg_def XMM16j( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   361
reg_def XMM16k( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   362
reg_def XMM16l( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   363
reg_def XMM16m( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   364
reg_def XMM16n( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   365
reg_def XMM16o( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   366
reg_def XMM16p( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   367
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   368
reg_def XMM17 ( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   369
reg_def XMM17b( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   370
reg_def XMM17c( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   371
reg_def XMM17d( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   372
reg_def XMM17e( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   373
reg_def XMM17f( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   374
reg_def XMM17g( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   375
reg_def XMM17h( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   376
reg_def XMM17i( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   377
reg_def XMM17j( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   378
reg_def XMM17k( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   379
reg_def XMM17l( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   380
reg_def XMM17m( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   381
reg_def XMM17n( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   382
reg_def XMM17o( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   383
reg_def XMM17p( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   384
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   385
reg_def XMM18 ( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   386
reg_def XMM18b( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   387
reg_def XMM18c( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   388
reg_def XMM18d( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   389
reg_def XMM18e( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   390
reg_def XMM18f( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   391
reg_def XMM18g( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   392
reg_def XMM18h( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   393
reg_def XMM18i( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   394
reg_def XMM18j( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   395
reg_def XMM18k( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   396
reg_def XMM18l( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   397
reg_def XMM18m( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   398
reg_def XMM18n( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   399
reg_def XMM18o( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   400
reg_def XMM18p( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   401
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   402
reg_def XMM19 ( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   403
reg_def XMM19b( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   404
reg_def XMM19c( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   405
reg_def XMM19d( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   406
reg_def XMM19e( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   407
reg_def XMM19f( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   408
reg_def XMM19g( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   409
reg_def XMM19h( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   410
reg_def XMM19i( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   411
reg_def XMM19j( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   412
reg_def XMM19k( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   413
reg_def XMM19l( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   414
reg_def XMM19m( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   415
reg_def XMM19n( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   416
reg_def XMM19o( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   417
reg_def XMM19p( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   418
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   419
reg_def XMM20 ( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   420
reg_def XMM20b( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   421
reg_def XMM20c( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   422
reg_def XMM20d( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   423
reg_def XMM20e( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   424
reg_def XMM20f( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   425
reg_def XMM20g( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   426
reg_def XMM20h( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   427
reg_def XMM20i( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   428
reg_def XMM20j( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   429
reg_def XMM20k( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   430
reg_def XMM20l( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   431
reg_def XMM20m( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   432
reg_def XMM20n( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   433
reg_def XMM20o( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   434
reg_def XMM20p( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   435
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   436
reg_def XMM21 ( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   437
reg_def XMM21b( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   438
reg_def XMM21c( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   439
reg_def XMM21d( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   440
reg_def XMM21e( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   441
reg_def XMM21f( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   442
reg_def XMM21g( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   443
reg_def XMM21h( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   444
reg_def XMM21i( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   445
reg_def XMM21j( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   446
reg_def XMM21k( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   447
reg_def XMM21l( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   448
reg_def XMM21m( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   449
reg_def XMM21n( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   450
reg_def XMM21o( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   451
reg_def XMM21p( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   452
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   453
reg_def XMM22 ( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   454
reg_def XMM22b( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   455
reg_def XMM22c( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   456
reg_def XMM22d( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   457
reg_def XMM22e( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   458
reg_def XMM22f( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   459
reg_def XMM22g( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   460
reg_def XMM22h( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   461
reg_def XMM22i( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   462
reg_def XMM22j( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   463
reg_def XMM22k( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   464
reg_def XMM22l( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   465
reg_def XMM22m( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   466
reg_def XMM22n( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   467
reg_def XMM22o( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   468
reg_def XMM22p( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   469
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   470
reg_def XMM23 ( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   471
reg_def XMM23b( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   472
reg_def XMM23c( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   473
reg_def XMM23d( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   474
reg_def XMM23e( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   475
reg_def XMM23f( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   476
reg_def XMM23g( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   477
reg_def XMM23h( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   478
reg_def XMM23i( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   479
reg_def XMM23j( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   480
reg_def XMM23k( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   481
reg_def XMM23l( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   482
reg_def XMM23m( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   483
reg_def XMM23n( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   484
reg_def XMM23o( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   485
reg_def XMM23p( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   486
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   487
reg_def XMM24 ( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   488
reg_def XMM24b( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   489
reg_def XMM24c( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   490
reg_def XMM24d( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   491
reg_def XMM24e( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   492
reg_def XMM24f( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   493
reg_def XMM24g( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   494
reg_def XMM24h( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   495
reg_def XMM24i( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   496
reg_def XMM24j( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   497
reg_def XMM24k( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   498
reg_def XMM24l( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   499
reg_def XMM24m( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   500
reg_def XMM24n( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   501
reg_def XMM24o( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   502
reg_def XMM24p( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   503
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   504
reg_def XMM25 ( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   505
reg_def XMM25b( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   506
reg_def XMM25c( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   507
reg_def XMM25d( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   508
reg_def XMM25e( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   509
reg_def XMM25f( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   510
reg_def XMM25g( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   511
reg_def XMM25h( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   512
reg_def XMM25i( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   513
reg_def XMM25j( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   514
reg_def XMM25k( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   515
reg_def XMM25l( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   516
reg_def XMM25m( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   517
reg_def XMM25n( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   518
reg_def XMM25o( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   519
reg_def XMM25p( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   520
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   521
reg_def XMM26 ( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   522
reg_def XMM26b( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   523
reg_def XMM26c( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   524
reg_def XMM26d( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   525
reg_def XMM26e( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   526
reg_def XMM26f( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   527
reg_def XMM26g( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   528
reg_def XMM26h( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   529
reg_def XMM26i( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   530
reg_def XMM26j( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   531
reg_def XMM26k( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   532
reg_def XMM26l( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   533
reg_def XMM26m( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   534
reg_def XMM26n( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   535
reg_def XMM26o( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   536
reg_def XMM26p( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   537
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   538
reg_def XMM27 ( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   539
reg_def XMM27b( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   540
reg_def XMM27c( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   541
reg_def XMM27d( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   542
reg_def XMM27e( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   543
reg_def XMM27f( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   544
reg_def XMM27g( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   545
reg_def XMM27h( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   546
reg_def XMM27i( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   547
reg_def XMM27j( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   548
reg_def XMM27k( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   549
reg_def XMM27l( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   550
reg_def XMM27m( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   551
reg_def XMM27n( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   552
reg_def XMM27o( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   553
reg_def XMM27p( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   554
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   555
reg_def XMM28 ( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   556
reg_def XMM28b( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   557
reg_def XMM28c( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   558
reg_def XMM28d( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   559
reg_def XMM28e( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   560
reg_def XMM28f( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   561
reg_def XMM28g( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   562
reg_def XMM28h( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   563
reg_def XMM28i( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   564
reg_def XMM28j( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   565
reg_def XMM28k( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   566
reg_def XMM28l( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   567
reg_def XMM28m( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   568
reg_def XMM28n( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   569
reg_def XMM28o( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   570
reg_def XMM28p( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   571
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   572
reg_def XMM29 ( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   573
reg_def XMM29b( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   574
reg_def XMM29c( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   575
reg_def XMM29d( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   576
reg_def XMM29e( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   577
reg_def XMM29f( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   578
reg_def XMM29g( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   579
reg_def XMM29h( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   580
reg_def XMM29i( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   581
reg_def XMM29j( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   582
reg_def XMM29k( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   583
reg_def XMM29l( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   584
reg_def XMM29m( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   585
reg_def XMM29n( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   586
reg_def XMM29o( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   587
reg_def XMM29p( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   588
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   589
reg_def XMM30 ( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   590
reg_def XMM30b( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   591
reg_def XMM30c( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   592
reg_def XMM30d( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   593
reg_def XMM30e( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   594
reg_def XMM30f( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   595
reg_def XMM30g( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   596
reg_def XMM30h( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   597
reg_def XMM30i( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   598
reg_def XMM30j( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   599
reg_def XMM30k( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   600
reg_def XMM30l( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   601
reg_def XMM30m( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   602
reg_def XMM30n( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   603
reg_def XMM30o( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   604
reg_def XMM30p( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   605
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   606
reg_def XMM31 ( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   607
reg_def XMM31b( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   608
reg_def XMM31c( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   609
reg_def XMM31d( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   610
reg_def XMM31e( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   611
reg_def XMM31f( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   612
reg_def XMM31g( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   613
reg_def XMM31h( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   614
reg_def XMM31i( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   615
reg_def XMM31j( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   616
reg_def XMM31k( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   617
reg_def XMM31l( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   618
reg_def XMM31m( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   619
reg_def XMM31n( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   620
reg_def XMM31o( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   621
reg_def XMM31p( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   622
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   623
#endif // _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   624
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   625
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   626
reg_def RFLAGS(SOC, SOC, 0, 16, VMRegImpl::Bad());
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   627
#else
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   628
reg_def RFLAGS(SOC, SOC, 0, 8, VMRegImpl::Bad());
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   629
#endif // _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   630
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   631
alloc_class chunk1(XMM0,  XMM0b,  XMM0c,  XMM0d,  XMM0e,  XMM0f,  XMM0g,  XMM0h,  XMM0i,  XMM0j,  XMM0k,  XMM0l,  XMM0m,  XMM0n,  XMM0o,  XMM0p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   632
                   XMM1,  XMM1b,  XMM1c,  XMM1d,  XMM1e,  XMM1f,  XMM1g,  XMM1h,  XMM1i,  XMM1j,  XMM1k,  XMM1l,  XMM1m,  XMM1n,  XMM1o,  XMM1p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   633
                   XMM2,  XMM2b,  XMM2c,  XMM2d,  XMM2e,  XMM2f,  XMM2g,  XMM2h,  XMM2i,  XMM2j,  XMM2k,  XMM2l,  XMM2m,  XMM2n,  XMM2o,  XMM2p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   634
                   XMM3,  XMM3b,  XMM3c,  XMM3d,  XMM3e,  XMM3f,  XMM3g,  XMM3h,  XMM3i,  XMM3j,  XMM3k,  XMM3l,  XMM3m,  XMM3n,  XMM3o,  XMM3p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   635
                   XMM4,  XMM4b,  XMM4c,  XMM4d,  XMM4e,  XMM4f,  XMM4g,  XMM4h,  XMM4i,  XMM4j,  XMM4k,  XMM4l,  XMM4m,  XMM4n,  XMM4o,  XMM4p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   636
                   XMM5,  XMM5b,  XMM5c,  XMM5d,  XMM5e,  XMM5f,  XMM5g,  XMM5h,  XMM5i,  XMM5j,  XMM5k,  XMM5l,  XMM5m,  XMM5n,  XMM5o,  XMM5p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   637
                   XMM6,  XMM6b,  XMM6c,  XMM6d,  XMM6e,  XMM6f,  XMM6g,  XMM6h,  XMM6i,  XMM6j,  XMM6k,  XMM6l,  XMM6m,  XMM6n,  XMM6o,  XMM6p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   638
                   XMM7,  XMM7b,  XMM7c,  XMM7d,  XMM7e,  XMM7f,  XMM7g,  XMM7h,  XMM7i,  XMM7j,  XMM7k,  XMM7l,  XMM7m,  XMM7n,  XMM7o,  XMM7p
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   639
#ifdef _LP64
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   640
                  ,XMM8,  XMM8b,  XMM8c,  XMM8d,  XMM8e,  XMM8f,  XMM8g,  XMM8h,  XMM8i,  XMM8j,  XMM8k,  XMM8l,  XMM8m,  XMM8n,  XMM8o,  XMM8p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   641
                   XMM9,  XMM9b,  XMM9c,  XMM9d,  XMM9e,  XMM9f,  XMM9g,  XMM9h,  XMM9i,  XMM9j,  XMM9k,  XMM9l,  XMM9m,  XMM9n,  XMM9o,  XMM9p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   642
                   XMM10, XMM10b, XMM10c, XMM10d, XMM10e, XMM10f, XMM10g, XMM10h, XMM10i, XMM10j, XMM10k, XMM10l, XMM10m, XMM10n, XMM10o, XMM10p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   643
                   XMM11, XMM11b, XMM11c, XMM11d, XMM11e, XMM11f, XMM11g, XMM11h, XMM11i, XMM11j, XMM11k, XMM11l, XMM11m, XMM11n, XMM11o, XMM11p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   644
                   XMM12, XMM12b, XMM12c, XMM12d, XMM12e, XMM12f, XMM12g, XMM12h, XMM12i, XMM12j, XMM12k, XMM12l, XMM12m, XMM12n, XMM12o, XMM12p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   645
                   XMM13, XMM13b, XMM13c, XMM13d, XMM13e, XMM13f, XMM13g, XMM13h, XMM13i, XMM13j, XMM13k, XMM13l, XMM13m, XMM13n, XMM13o, XMM13p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   646
                   XMM14, XMM14b, XMM14c, XMM14d, XMM14e, XMM14f, XMM14g, XMM14h, XMM14i, XMM14j, XMM14k, XMM14l, XMM14m, XMM14n, XMM14o, XMM14p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   647
                   XMM15, XMM15b, XMM15c, XMM15d, XMM15e, XMM15f, XMM15g, XMM15h, XMM15i, XMM15j, XMM15k, XMM15l, XMM15m, XMM15n, XMM15o, XMM15p
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   648
                  ,XMM16, XMM16b, XMM16c, XMM16d, XMM16e, XMM16f, XMM16g, XMM16h, XMM16i, XMM16j, XMM16k, XMM16l, XMM16m, XMM16n, XMM16o, XMM16p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   649
                   XMM17, XMM17b, XMM17c, XMM17d, XMM17e, XMM17f, XMM17g, XMM17h, XMM17i, XMM17j, XMM17k, XMM17l, XMM17m, XMM17n, XMM17o, XMM17p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   650
                   XMM18, XMM18b, XMM18c, XMM18d, XMM18e, XMM18f, XMM18g, XMM18h, XMM18i, XMM18j, XMM18k, XMM18l, XMM18m, XMM18n, XMM18o, XMM18p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   651
                   XMM19, XMM19b, XMM19c, XMM19d, XMM19e, XMM19f, XMM19g, XMM19h, XMM19i, XMM19j, XMM19k, XMM19l, XMM19m, XMM19n, XMM19o, XMM19p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   652
                   XMM20, XMM20b, XMM20c, XMM20d, XMM20e, XMM20f, XMM20g, XMM20h, XMM20i, XMM20j, XMM20k, XMM20l, XMM20m, XMM20n, XMM20o, XMM20p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   653
                   XMM21, XMM21b, XMM21c, XMM21d, XMM21e, XMM21f, XMM21g, XMM21h, XMM21i, XMM21j, XMM21k, XMM21l, XMM21m, XMM21n, XMM21o, XMM21p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   654
                   XMM22, XMM22b, XMM22c, XMM22d, XMM22e, XMM22f, XMM22g, XMM22h, XMM22i, XMM22j, XMM22k, XMM22l, XMM22m, XMM22n, XMM22o, XMM22p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   655
                   XMM23, XMM23b, XMM23c, XMM23d, XMM23e, XMM23f, XMM23g, XMM23h, XMM23i, XMM23j, XMM23k, XMM23l, XMM23m, XMM23n, XMM23o, XMM23p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   656
                   XMM24, XMM24b, XMM24c, XMM24d, XMM24e, XMM24f, XMM24g, XMM24h, XMM24i, XMM24j, XMM24k, XMM24l, XMM24m, XMM24n, XMM24o, XMM24p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   657
                   XMM25, XMM25b, XMM25c, XMM25d, XMM25e, XMM25f, XMM25g, XMM25h, XMM25i, XMM25j, XMM25k, XMM25l, XMM25m, XMM25n, XMM25o, XMM25p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   658
                   XMM26, XMM26b, XMM26c, XMM26d, XMM26e, XMM26f, XMM26g, XMM26h, XMM26i, XMM26j, XMM26k, XMM26l, XMM26m, XMM26n, XMM26o, XMM26p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   659
                   XMM27, XMM27b, XMM27c, XMM27d, XMM27e, XMM27f, XMM27g, XMM27h, XMM27i, XMM27j, XMM27k, XMM27l, XMM27m, XMM27n, XMM27o, XMM27p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   660
                   XMM28, XMM28b, XMM28c, XMM28d, XMM28e, XMM28f, XMM28g, XMM28h, XMM28i, XMM28j, XMM28k, XMM28l, XMM28m, XMM28n, XMM28o, XMM28p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   661
                   XMM29, XMM29b, XMM29c, XMM29d, XMM29e, XMM29f, XMM29g, XMM29h, XMM29i, XMM29j, XMM29k, XMM29l, XMM29m, XMM29n, XMM29o, XMM29p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   662
                   XMM30, XMM30b, XMM30c, XMM30d, XMM30e, XMM30f, XMM30g, XMM30h, XMM30i, XMM30j, XMM30k, XMM30l, XMM30m, XMM30n, XMM30o, XMM30p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   663
                   XMM31, XMM31b, XMM31c, XMM31d, XMM31e, XMM31f, XMM31g, XMM31h, XMM31i, XMM31j, XMM31k, XMM31l, XMM31m, XMM31n, XMM31o, XMM31p
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   664
#endif
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   665
                      );
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   666
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   667
// flags allocation class should be last.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   668
alloc_class chunk2(RFLAGS);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   669
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   670
// Singleton class for condition codes
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   671
reg_class int_flags(RFLAGS);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   672
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   673
// Class for pre evex float registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   674
reg_class float_reg_legacy(XMM0,
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   675
                    XMM1,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   676
                    XMM2,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   677
                    XMM3,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   678
                    XMM4,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   679
                    XMM5,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   680
                    XMM6,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   681
                    XMM7
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   682
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   683
                   ,XMM8,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   684
                    XMM9,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   685
                    XMM10,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   686
                    XMM11,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   687
                    XMM12,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   688
                    XMM13,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   689
                    XMM14,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   690
                    XMM15
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   691
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   692
                    );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   693
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   694
// Class for evex float registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   695
reg_class float_reg_evex(XMM0,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   696
                    XMM1,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   697
                    XMM2,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   698
                    XMM3,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   699
                    XMM4,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   700
                    XMM5,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   701
                    XMM6,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   702
                    XMM7
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   703
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   704
                   ,XMM8,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   705
                    XMM9,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   706
                    XMM10,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   707
                    XMM11,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   708
                    XMM12,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   709
                    XMM13,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   710
                    XMM14,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   711
                    XMM15,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   712
                    XMM16,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   713
                    XMM17,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   714
                    XMM18,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   715
                    XMM19,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   716
                    XMM20,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   717
                    XMM21,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   718
                    XMM22,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   719
                    XMM23,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   720
                    XMM24,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   721
                    XMM25,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   722
                    XMM26,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   723
                    XMM27,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   724
                    XMM28,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   725
                    XMM29,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   726
                    XMM30,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   727
                    XMM31
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   728
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   729
                    );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   730
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   731
reg_class_dynamic float_reg(float_reg_evex, float_reg_legacy, %{ VM_Version::supports_evex() %} );
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
   732
reg_class_dynamic float_reg_vl(float_reg_evex, float_reg_legacy, %{ VM_Version::supports_evex() && VM_Version::supports_avx512vl() %} );
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   733
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   734
// Class for pre evex double registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   735
reg_class double_reg_legacy(XMM0,  XMM0b,
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   736
                     XMM1,  XMM1b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   737
                     XMM2,  XMM2b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   738
                     XMM3,  XMM3b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   739
                     XMM4,  XMM4b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   740
                     XMM5,  XMM5b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   741
                     XMM6,  XMM6b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   742
                     XMM7,  XMM7b
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   743
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   744
                    ,XMM8,  XMM8b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   745
                     XMM9,  XMM9b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   746
                     XMM10, XMM10b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   747
                     XMM11, XMM11b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   748
                     XMM12, XMM12b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   749
                     XMM13, XMM13b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   750
                     XMM14, XMM14b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   751
                     XMM15, XMM15b
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   752
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   753
                     );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   754
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   755
// Class for evex double registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   756
reg_class double_reg_evex(XMM0,  XMM0b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   757
                     XMM1,  XMM1b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   758
                     XMM2,  XMM2b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   759
                     XMM3,  XMM3b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   760
                     XMM4,  XMM4b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   761
                     XMM5,  XMM5b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   762
                     XMM6,  XMM6b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   763
                     XMM7,  XMM7b
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   764
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   765
                    ,XMM8,  XMM8b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   766
                     XMM9,  XMM9b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   767
                     XMM10, XMM10b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   768
                     XMM11, XMM11b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   769
                     XMM12, XMM12b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   770
                     XMM13, XMM13b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   771
                     XMM14, XMM14b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   772
                     XMM15, XMM15b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   773
                     XMM16, XMM16b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   774
                     XMM17, XMM17b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   775
                     XMM18, XMM18b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   776
                     XMM19, XMM19b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   777
                     XMM20, XMM20b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   778
                     XMM21, XMM21b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   779
                     XMM22, XMM22b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   780
                     XMM23, XMM23b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   781
                     XMM24, XMM24b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   782
                     XMM25, XMM25b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   783
                     XMM26, XMM26b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   784
                     XMM27, XMM27b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   785
                     XMM28, XMM28b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   786
                     XMM29, XMM29b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   787
                     XMM30, XMM30b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   788
                     XMM31, XMM31b
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   789
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   790
                     );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   791
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   792
reg_class_dynamic double_reg(double_reg_evex, double_reg_legacy, %{ VM_Version::supports_evex() %} );
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
   793
reg_class_dynamic double_reg_vl(double_reg_evex, double_reg_legacy, %{ VM_Version::supports_evex() && VM_Version::supports_avx512vl() %} );
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   794
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   795
// Class for pre evex 32bit vector registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   796
reg_class vectors_reg_legacy(XMM0,
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   797
                      XMM1,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   798
                      XMM2,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   799
                      XMM3,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   800
                      XMM4,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   801
                      XMM5,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   802
                      XMM6,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   803
                      XMM7
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   804
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   805
                     ,XMM8,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   806
                      XMM9,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   807
                      XMM10,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   808
                      XMM11,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   809
                      XMM12,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   810
                      XMM13,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   811
                      XMM14,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   812
                      XMM15
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   813
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   814
                      );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   815
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   816
// Class for evex 32bit vector registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   817
reg_class vectors_reg_evex(XMM0,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   818
                      XMM1,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   819
                      XMM2,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   820
                      XMM3,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   821
                      XMM4,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   822
                      XMM5,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   823
                      XMM6,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   824
                      XMM7
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   825
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   826
                     ,XMM8,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   827
                      XMM9,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   828
                      XMM10,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   829
                      XMM11,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   830
                      XMM12,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   831
                      XMM13,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   832
                      XMM14,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   833
                      XMM15,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   834
                      XMM16,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   835
                      XMM17,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   836
                      XMM18,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   837
                      XMM19,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   838
                      XMM20,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   839
                      XMM21,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   840
                      XMM22,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   841
                      XMM23,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   842
                      XMM24,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   843
                      XMM25,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   844
                      XMM26,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   845
                      XMM27,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   846
                      XMM28,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   847
                      XMM29,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   848
                      XMM30,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   849
                      XMM31
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   850
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   851
                      );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   852
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   853
reg_class_dynamic vectors_reg(vectors_reg_evex, vectors_reg_legacy, %{ VM_Version::supports_evex() %} );
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
   854
reg_class_dynamic vectors_reg_vlbwdq(vectors_reg_evex, vectors_reg_legacy, %{ VM_Version::supports_avx512vlbwdq() %} );
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   855
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   856
// Class for all 64bit vector registers
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   857
reg_class vectord_reg_legacy(XMM0,  XMM0b,
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   858
                      XMM1,  XMM1b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   859
                      XMM2,  XMM2b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   860
                      XMM3,  XMM3b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   861
                      XMM4,  XMM4b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   862
                      XMM5,  XMM5b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   863
                      XMM6,  XMM6b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   864
                      XMM7,  XMM7b
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   865
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   866
                     ,XMM8,  XMM8b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   867
                      XMM9,  XMM9b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   868
                      XMM10, XMM10b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   869
                      XMM11, XMM11b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   870
                      XMM12, XMM12b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   871
                      XMM13, XMM13b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   872
                      XMM14, XMM14b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   873
                      XMM15, XMM15b
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   874
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   875
                      );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   876
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   877
// Class for all 64bit vector registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   878
reg_class vectord_reg_evex(XMM0,  XMM0b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   879
                      XMM1,  XMM1b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   880
                      XMM2,  XMM2b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   881
                      XMM3,  XMM3b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   882
                      XMM4,  XMM4b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   883
                      XMM5,  XMM5b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   884
                      XMM6,  XMM6b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   885
                      XMM7,  XMM7b
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   886
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   887
                     ,XMM8,  XMM8b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   888
                      XMM9,  XMM9b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   889
                      XMM10, XMM10b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   890
                      XMM11, XMM11b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   891
                      XMM12, XMM12b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   892
                      XMM13, XMM13b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   893
                      XMM14, XMM14b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   894
                      XMM15, XMM15b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   895
                      XMM16, XMM16b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   896
                      XMM17, XMM17b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   897
                      XMM18, XMM18b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   898
                      XMM19, XMM19b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   899
                      XMM20, XMM20b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   900
                      XMM21, XMM21b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   901
                      XMM22, XMM22b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   902
                      XMM23, XMM23b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   903
                      XMM24, XMM24b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   904
                      XMM25, XMM25b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   905
                      XMM26, XMM26b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   906
                      XMM27, XMM27b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   907
                      XMM28, XMM28b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   908
                      XMM29, XMM29b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   909
                      XMM30, XMM30b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   910
                      XMM31, XMM31b
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   911
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   912
                      );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   913
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   914
reg_class_dynamic vectord_reg(vectord_reg_evex, vectord_reg_legacy, %{ VM_Version::supports_evex() %} );
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
   915
reg_class_dynamic vectord_reg_vlbwdq(vectord_reg_evex, vectord_reg_legacy, %{ VM_Version::supports_avx512vlbwdq() %} );
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   916
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   917
// Class for all 128bit vector registers
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   918
reg_class vectorx_reg_legacy(XMM0,  XMM0b,  XMM0c,  XMM0d,
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   919
                      XMM1,  XMM1b,  XMM1c,  XMM1d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   920
                      XMM2,  XMM2b,  XMM2c,  XMM2d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   921
                      XMM3,  XMM3b,  XMM3c,  XMM3d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   922
                      XMM4,  XMM4b,  XMM4c,  XMM4d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   923
                      XMM5,  XMM5b,  XMM5c,  XMM5d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   924
                      XMM6,  XMM6b,  XMM6c,  XMM6d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   925
                      XMM7,  XMM7b,  XMM7c,  XMM7d
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   926
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   927
                     ,XMM8,  XMM8b,  XMM8c,  XMM8d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   928
                      XMM9,  XMM9b,  XMM9c,  XMM9d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   929
                      XMM10, XMM10b, XMM10c, XMM10d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   930
                      XMM11, XMM11b, XMM11c, XMM11d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   931
                      XMM12, XMM12b, XMM12c, XMM12d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   932
                      XMM13, XMM13b, XMM13c, XMM13d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   933
                      XMM14, XMM14b, XMM14c, XMM14d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   934
                      XMM15, XMM15b, XMM15c, XMM15d
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   935
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   936
                      );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   937
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   938
// Class for all 128bit vector registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   939
reg_class vectorx_reg_evex(XMM0,  XMM0b,  XMM0c,  XMM0d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   940
                      XMM1,  XMM1b,  XMM1c,  XMM1d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   941
                      XMM2,  XMM2b,  XMM2c,  XMM2d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   942
                      XMM3,  XMM3b,  XMM3c,  XMM3d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   943
                      XMM4,  XMM4b,  XMM4c,  XMM4d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   944
                      XMM5,  XMM5b,  XMM5c,  XMM5d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   945
                      XMM6,  XMM6b,  XMM6c,  XMM6d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   946
                      XMM7,  XMM7b,  XMM7c,  XMM7d
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   947
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   948
                     ,XMM8,  XMM8b,  XMM8c,  XMM8d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   949
                      XMM9,  XMM9b,  XMM9c,  XMM9d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   950
                      XMM10, XMM10b, XMM10c, XMM10d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   951
                      XMM11, XMM11b, XMM11c, XMM11d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   952
                      XMM12, XMM12b, XMM12c, XMM12d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   953
                      XMM13, XMM13b, XMM13c, XMM13d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   954
                      XMM14, XMM14b, XMM14c, XMM14d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   955
                      XMM15, XMM15b, XMM15c, XMM15d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   956
                      XMM16, XMM16b, XMM16c, XMM16d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   957
                      XMM17, XMM17b, XMM17c, XMM17d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   958
                      XMM18, XMM18b, XMM18c, XMM18d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   959
                      XMM19, XMM19b, XMM19c, XMM19d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   960
                      XMM20, XMM20b, XMM20c, XMM20d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   961
                      XMM21, XMM21b, XMM21c, XMM21d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   962
                      XMM22, XMM22b, XMM22c, XMM22d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   963
                      XMM23, XMM23b, XMM23c, XMM23d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   964
                      XMM24, XMM24b, XMM24c, XMM24d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   965
                      XMM25, XMM25b, XMM25c, XMM25d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   966
                      XMM26, XMM26b, XMM26c, XMM26d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   967
                      XMM27, XMM27b, XMM27c, XMM27d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   968
                      XMM28, XMM28b, XMM28c, XMM28d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   969
                      XMM29, XMM29b, XMM29c, XMM29d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   970
                      XMM30, XMM30b, XMM30c, XMM30d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   971
                      XMM31, XMM31b, XMM31c, XMM31d
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   972
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   973
                      );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   974
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   975
reg_class_dynamic vectorx_reg(vectorx_reg_evex, vectorx_reg_legacy, %{ VM_Version::supports_evex() %} );
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
   976
reg_class_dynamic vectorx_reg_vlbwdq(vectorx_reg_evex, vectorx_reg_legacy, %{ VM_Version::supports_avx512vlbwdq() %} );
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   977
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   978
// Class for all 256bit vector registers
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   979
reg_class vectory_reg_legacy(XMM0,  XMM0b,  XMM0c,  XMM0d,  XMM0e,  XMM0f,  XMM0g,  XMM0h,
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   980
                      XMM1,  XMM1b,  XMM1c,  XMM1d,  XMM1e,  XMM1f,  XMM1g,  XMM1h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   981
                      XMM2,  XMM2b,  XMM2c,  XMM2d,  XMM2e,  XMM2f,  XMM2g,  XMM2h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   982
                      XMM3,  XMM3b,  XMM3c,  XMM3d,  XMM3e,  XMM3f,  XMM3g,  XMM3h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   983
                      XMM4,  XMM4b,  XMM4c,  XMM4d,  XMM4e,  XMM4f,  XMM4g,  XMM4h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   984
                      XMM5,  XMM5b,  XMM5c,  XMM5d,  XMM5e,  XMM5f,  XMM5g,  XMM5h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   985
                      XMM6,  XMM6b,  XMM6c,  XMM6d,  XMM6e,  XMM6f,  XMM6g,  XMM6h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   986
                      XMM7,  XMM7b,  XMM7c,  XMM7d,  XMM7e,  XMM7f,  XMM7g,  XMM7h
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   987
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   988
                     ,XMM8,  XMM8b,  XMM8c,  XMM8d,  XMM8e,  XMM8f,  XMM8g,  XMM8h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   989
                      XMM9,  XMM9b,  XMM9c,  XMM9d,  XMM9e,  XMM9f,  XMM9g,  XMM9h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   990
                      XMM10, XMM10b, XMM10c, XMM10d, XMM10e, XMM10f, XMM10g, XMM10h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   991
                      XMM11, XMM11b, XMM11c, XMM11d, XMM11e, XMM11f, XMM11g, XMM11h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   992
                      XMM12, XMM12b, XMM12c, XMM12d, XMM12e, XMM12f, XMM12g, XMM12h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   993
                      XMM13, XMM13b, XMM13c, XMM13d, XMM13e, XMM13f, XMM13g, XMM13h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   994
                      XMM14, XMM14b, XMM14c, XMM14d, XMM14e, XMM14f, XMM14g, XMM14h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   995
                      XMM15, XMM15b, XMM15c, XMM15d, XMM15e, XMM15f, XMM15g, XMM15h
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   996
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   997
                      );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   998
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   999
// Class for all 256bit vector registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1000
reg_class vectory_reg_evex(XMM0,  XMM0b,  XMM0c,  XMM0d,  XMM0e,  XMM0f,  XMM0g,  XMM0h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1001
                      XMM1,  XMM1b,  XMM1c,  XMM1d,  XMM1e,  XMM1f,  XMM1g,  XMM1h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1002
                      XMM2,  XMM2b,  XMM2c,  XMM2d,  XMM2e,  XMM2f,  XMM2g,  XMM2h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1003
                      XMM3,  XMM3b,  XMM3c,  XMM3d,  XMM3e,  XMM3f,  XMM3g,  XMM3h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1004
                      XMM4,  XMM4b,  XMM4c,  XMM4d,  XMM4e,  XMM4f,  XMM4g,  XMM4h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1005
                      XMM5,  XMM5b,  XMM5c,  XMM5d,  XMM5e,  XMM5f,  XMM5g,  XMM5h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1006
                      XMM6,  XMM6b,  XMM6c,  XMM6d,  XMM6e,  XMM6f,  XMM6g,  XMM6h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1007
                      XMM7,  XMM7b,  XMM7c,  XMM7d,  XMM7e,  XMM7f,  XMM7g,  XMM7h
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1008
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1009
                     ,XMM8,  XMM8b,  XMM8c,  XMM8d,  XMM8e,  XMM8f,  XMM8g,  XMM8h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1010
                      XMM9,  XMM9b,  XMM9c,  XMM9d,  XMM9e,  XMM9f,  XMM9g,  XMM9h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1011
                      XMM10, XMM10b, XMM10c, XMM10d, XMM10e, XMM10f, XMM10g, XMM10h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1012
                      XMM11, XMM11b, XMM11c, XMM11d, XMM11e, XMM11f, XMM11g, XMM11h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1013
                      XMM12, XMM12b, XMM12c, XMM12d, XMM12e, XMM12f, XMM12g, XMM12h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1014
                      XMM13, XMM13b, XMM13c, XMM13d, XMM13e, XMM13f, XMM13g, XMM13h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1015
                      XMM14, XMM14b, XMM14c, XMM14d, XMM14e, XMM14f, XMM14g, XMM14h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1016
                      XMM15, XMM15b, XMM15c, XMM15d, XMM15e, XMM15f, XMM15g, XMM15h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1017
                      XMM16, XMM16b, XMM16c, XMM16d, XMM16e, XMM16f, XMM16g, XMM16h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1018
                      XMM17, XMM17b, XMM17c, XMM17d, XMM17e, XMM17f, XMM17g, XMM17h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1019
                      XMM18, XMM18b, XMM18c, XMM18d, XMM18e, XMM18f, XMM18g, XMM18h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1020
                      XMM19, XMM19b, XMM19c, XMM19d, XMM19e, XMM19f, XMM19g, XMM19h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1021
                      XMM20, XMM20b, XMM20c, XMM20d, XMM20e, XMM20f, XMM20g, XMM20h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1022
                      XMM21, XMM21b, XMM21c, XMM21d, XMM21e, XMM21f, XMM21g, XMM21h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1023
                      XMM22, XMM22b, XMM22c, XMM22d, XMM22e, XMM22f, XMM22g, XMM22h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1024
                      XMM23, XMM23b, XMM23c, XMM23d, XMM23e, XMM23f, XMM23g, XMM23h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1025
                      XMM24, XMM24b, XMM24c, XMM24d, XMM24e, XMM24f, XMM24g, XMM24h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1026
                      XMM25, XMM25b, XMM25c, XMM25d, XMM25e, XMM25f, XMM25g, XMM25h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1027
                      XMM26, XMM26b, XMM26c, XMM26d, XMM26e, XMM26f, XMM26g, XMM26h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1028
                      XMM27, XMM27b, XMM27c, XMM27d, XMM27e, XMM27f, XMM27g, XMM27h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1029
                      XMM28, XMM28b, XMM28c, XMM28d, XMM28e, XMM28f, XMM28g, XMM28h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1030
                      XMM29, XMM29b, XMM29c, XMM29d, XMM29e, XMM29f, XMM29g, XMM29h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1031
                      XMM30, XMM30b, XMM30c, XMM30d, XMM30e, XMM30f, XMM30g, XMM30h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1032
                      XMM31, XMM31b, XMM31c, XMM31d, XMM31e, XMM31f, XMM31g, XMM31h
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1033
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1034
                      );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1035
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1036
reg_class_dynamic vectory_reg(vectory_reg_evex, vectory_reg_legacy, %{ VM_Version::supports_evex() %} );
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1037
reg_class_dynamic vectory_reg_vlbwdq(vectory_reg_evex, vectory_reg_legacy, %{ VM_Version::supports_avx512vlbwdq() %} );
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1038
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1039
// Class for all 512bit vector registers
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1040
reg_class vectorz_reg_evex(XMM0,  XMM0b,  XMM0c,  XMM0d,  XMM0e,  XMM0f,  XMM0g,  XMM0h,  XMM0i,  XMM0j,  XMM0k,  XMM0l,  XMM0m,  XMM0n,  XMM0o,  XMM0p,
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1041
                      XMM1,  XMM1b,  XMM1c,  XMM1d,  XMM1e,  XMM1f,  XMM1g,  XMM1h,  XMM1i,  XMM1j,  XMM1k,  XMM1l,  XMM1m,  XMM1n,  XMM1o,  XMM1p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1042
                      XMM2,  XMM2b,  XMM2c,  XMM2d,  XMM2e,  XMM2f,  XMM2g,  XMM2h,  XMM2i,  XMM2j,  XMM2k,  XMM2l,  XMM2m,  XMM2n,  XMM2o,  XMM2p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1043
                      XMM3,  XMM3b,  XMM3c,  XMM3d,  XMM3e,  XMM3f,  XMM3g,  XMM3h,  XMM3i,  XMM3j,  XMM3k,  XMM3l,  XMM3m,  XMM3n,  XMM3o,  XMM3p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1044
                      XMM4,  XMM4b,  XMM4c,  XMM4d,  XMM4e,  XMM4f,  XMM4g,  XMM4h,  XMM4i,  XMM4j,  XMM4k,  XMM4l,  XMM4m,  XMM4n,  XMM4o,  XMM4p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1045
                      XMM5,  XMM5b,  XMM5c,  XMM5d,  XMM5e,  XMM5f,  XMM5g,  XMM5h,  XMM5i,  XMM5j,  XMM5k,  XMM5l,  XMM5m,  XMM5n,  XMM5o,  XMM5p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1046
                      XMM6,  XMM6b,  XMM6c,  XMM6d,  XMM6e,  XMM6f,  XMM6g,  XMM6h,  XMM6i,  XMM6j,  XMM6k,  XMM6l,  XMM6m,  XMM6n,  XMM6o,  XMM6p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1047
                      XMM7,  XMM7b,  XMM7c,  XMM7d,  XMM7e,  XMM7f,  XMM7g,  XMM7h,  XMM7i,  XMM7j,  XMM7k,  XMM7l,  XMM7m,  XMM7n,  XMM7o,  XMM7p
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1048
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1049
                     ,XMM8,  XMM8b,  XMM8c,  XMM8d,  XMM8e,  XMM8f,  XMM8g,  XMM8h,  XMM8i,  XMM8j,  XMM8k,  XMM8l,  XMM8m,  XMM8n,  XMM8o,  XMM8p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1050
                      XMM9,  XMM9b,  XMM9c,  XMM9d,  XMM9e,  XMM9f,  XMM9g,  XMM9h,  XMM9i,  XMM9j,  XMM9k,  XMM9l,  XMM9m,  XMM9n,  XMM9o,  XMM9p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1051
                      XMM10, XMM10b, XMM10c, XMM10d, XMM10e, XMM10f, XMM10g, XMM10h, XMM10i, XMM10j, XMM10k, XMM10l, XMM10m, XMM10n, XMM10o, XMM10p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1052
                      XMM11, XMM11b, XMM11c, XMM11d, XMM11e, XMM11f, XMM11g, XMM11h, XMM11i, XMM11j, XMM11k, XMM11l, XMM11m, XMM11n, XMM11o, XMM11p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1053
                      XMM12, XMM12b, XMM12c, XMM12d, XMM12e, XMM12f, XMM12g, XMM12h, XMM12i, XMM12j, XMM12k, XMM12l, XMM12m, XMM12n, XMM12o, XMM12p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1054
                      XMM13, XMM13b, XMM13c, XMM13d, XMM13e, XMM13f, XMM13g, XMM13h, XMM13i, XMM13j, XMM13k, XMM13l, XMM13m, XMM13n, XMM13o, XMM13p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1055
                      XMM14, XMM14b, XMM14c, XMM14d, XMM14e, XMM14f, XMM14g, XMM14h, XMM14i, XMM14j, XMM14k, XMM14l, XMM14m, XMM14n, XMM14o, XMM14p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1056
                      XMM15, XMM15b, XMM15c, XMM15d, XMM15e, XMM15f, XMM15g, XMM15h, XMM15i, XMM15j, XMM15k, XMM15l, XMM15m, XMM15n, XMM15o, XMM15p
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1057
                     ,XMM16, XMM16b, XMM16c, XMM16d, XMM16e, XMM16f, XMM16g, XMM16h, XMM16i, XMM16j, XMM16k, XMM16l, XMM16m, XMM16n, XMM16o, XMM16p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1058
                      XMM17, XMM17b, XMM17c, XMM17d, XMM17e, XMM17f, XMM17g, XMM17h, XMM17i, XMM17j, XMM17k, XMM17l, XMM17m, XMM17n, XMM17o, XMM17p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1059
                      XMM18, XMM18b, XMM18c, XMM18d, XMM18e, XMM18f, XMM18g, XMM18h, XMM18i, XMM18j, XMM18k, XMM18l, XMM18m, XMM18n, XMM18o, XMM18p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1060
                      XMM19, XMM19b, XMM19c, XMM19d, XMM19e, XMM19f, XMM19g, XMM19h, XMM19i, XMM19j, XMM19k, XMM19l, XMM19m, XMM19n, XMM19o, XMM19p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1061
                      XMM20, XMM20b, XMM20c, XMM20d, XMM20e, XMM20f, XMM20g, XMM20h, XMM20i, XMM20j, XMM20k, XMM20l, XMM20m, XMM20n, XMM20o, XMM20p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1062
                      XMM21, XMM21b, XMM21c, XMM21d, XMM21e, XMM21f, XMM21g, XMM21h, XMM21i, XMM21j, XMM21k, XMM21l, XMM21m, XMM21n, XMM21o, XMM21p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1063
                      XMM22, XMM22b, XMM22c, XMM22d, XMM22e, XMM22f, XMM22g, XMM22h, XMM22i, XMM22j, XMM22k, XMM22l, XMM22m, XMM22n, XMM22o, XMM22p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1064
                      XMM23, XMM23b, XMM23c, XMM23d, XMM23e, XMM23f, XMM23g, XMM23h, XMM23i, XMM23j, XMM23k, XMM23l, XMM23m, XMM23n, XMM23o, XMM23p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1065
                      XMM24, XMM24b, XMM24c, XMM24d, XMM24e, XMM24f, XMM24g, XMM24h, XMM24i, XMM24j, XMM24k, XMM24l, XMM24m, XMM24n, XMM24o, XMM24p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1066
                      XMM25, XMM25b, XMM25c, XMM25d, XMM25e, XMM25f, XMM25g, XMM25h, XMM25i, XMM25j, XMM25k, XMM25l, XMM25m, XMM25n, XMM25o, XMM25p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1067
                      XMM26, XMM26b, XMM26c, XMM26d, XMM26e, XMM26f, XMM26g, XMM26h, XMM26i, XMM26j, XMM26k, XMM26l, XMM26m, XMM26n, XMM26o, XMM26p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1068
                      XMM27, XMM27b, XMM27c, XMM27d, XMM27e, XMM27f, XMM27g, XMM27h, XMM27i, XMM27j, XMM27k, XMM27l, XMM27m, XMM27n, XMM27o, XMM27p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1069
                      XMM28, XMM28b, XMM28c, XMM28d, XMM28e, XMM28f, XMM28g, XMM28h, XMM28i, XMM28j, XMM28k, XMM28l, XMM28m, XMM28n, XMM28o, XMM28p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1070
                      XMM29, XMM29b, XMM29c, XMM29d, XMM29e, XMM29f, XMM29g, XMM29h, XMM29i, XMM29j, XMM29k, XMM29l, XMM29m, XMM29n, XMM29o, XMM29p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1071
                      XMM30, XMM30b, XMM30c, XMM30d, XMM30e, XMM30f, XMM30g, XMM30h, XMM30i, XMM30j, XMM30k, XMM30l, XMM30m, XMM30n, XMM30o, XMM30p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1072
                      XMM31, XMM31b, XMM31c, XMM31d, XMM31e, XMM31f, XMM31g, XMM31h, XMM31i, XMM31j, XMM31k, XMM31l, XMM31m, XMM31n, XMM31o, XMM31p
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1073
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1074
                      );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1075
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1076
// Class for restricted 512bit vector registers
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1077
reg_class vectorz_reg_legacy(XMM0,  XMM0b,  XMM0c,  XMM0d,  XMM0e,  XMM0f,  XMM0g,  XMM0h,  XMM0i,  XMM0j,  XMM0k,  XMM0l,  XMM0m,  XMM0n,  XMM0o,  XMM0p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1078
                      XMM1,  XMM1b,  XMM1c,  XMM1d,  XMM1e,  XMM1f,  XMM1g,  XMM1h,  XMM1i,  XMM1j,  XMM1k,  XMM1l,  XMM1m,  XMM1n,  XMM1o,  XMM1p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1079
                      XMM2,  XMM2b,  XMM2c,  XMM2d,  XMM2e,  XMM2f,  XMM2g,  XMM2h,  XMM2i,  XMM2j,  XMM2k,  XMM2l,  XMM2m,  XMM2n,  XMM2o,  XMM2p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1080
                      XMM3,  XMM3b,  XMM3c,  XMM3d,  XMM3e,  XMM3f,  XMM3g,  XMM3h,  XMM3i,  XMM3j,  XMM3k,  XMM3l,  XMM3m,  XMM3n,  XMM3o,  XMM3p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1081
                      XMM4,  XMM4b,  XMM4c,  XMM4d,  XMM4e,  XMM4f,  XMM4g,  XMM4h,  XMM4i,  XMM4j,  XMM4k,  XMM4l,  XMM4m,  XMM4n,  XMM4o,  XMM4p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1082
                      XMM5,  XMM5b,  XMM5c,  XMM5d,  XMM5e,  XMM5f,  XMM5g,  XMM5h,  XMM5i,  XMM5j,  XMM5k,  XMM5l,  XMM5m,  XMM5n,  XMM5o,  XMM5p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1083
                      XMM6,  XMM6b,  XMM6c,  XMM6d,  XMM6e,  XMM6f,  XMM6g,  XMM6h,  XMM6i,  XMM6j,  XMM6k,  XMM6l,  XMM6m,  XMM6n,  XMM6o,  XMM6p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1084
                      XMM7,  XMM7b,  XMM7c,  XMM7d,  XMM7e,  XMM7f,  XMM7g,  XMM7h,  XMM7i,  XMM7j,  XMM7k,  XMM7l,  XMM7m,  XMM7n,  XMM7o,  XMM7p
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1085
#ifdef _LP64
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1086
                     ,XMM8,  XMM8b,  XMM8c,  XMM8d,  XMM8e,  XMM8f,  XMM8g,  XMM8h,  XMM8i,  XMM8j,  XMM8k,  XMM8l,  XMM8m,  XMM8n,  XMM8o,  XMM8p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1087
                      XMM9,  XMM9b,  XMM9c,  XMM9d,  XMM9e,  XMM9f,  XMM9g,  XMM9h,  XMM9i,  XMM9j,  XMM9k,  XMM9l,  XMM9m,  XMM9n,  XMM9o,  XMM9p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1088
                      XMM10, XMM10b, XMM10c, XMM10d, XMM10e, XMM10f, XMM10g, XMM10h, XMM10i, XMM10j, XMM10k, XMM10l, XMM10m, XMM10n, XMM10o, XMM10p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1089
                      XMM11, XMM11b, XMM11c, XMM11d, XMM11e, XMM11f, XMM11g, XMM11h, XMM11i, XMM11j, XMM11k, XMM11l, XMM11m, XMM11n, XMM11o, XMM11p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1090
                      XMM12, XMM12b, XMM12c, XMM12d, XMM12e, XMM12f, XMM12g, XMM12h, XMM12i, XMM12j, XMM12k, XMM12l, XMM12m, XMM12n, XMM12o, XMM12p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1091
                      XMM13, XMM13b, XMM13c, XMM13d, XMM13e, XMM13f, XMM13g, XMM13h, XMM13i, XMM13j, XMM13k, XMM13l, XMM13m, XMM13n, XMM13o, XMM13p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1092
                      XMM14, XMM14b, XMM14c, XMM14d, XMM14e, XMM14f, XMM14g, XMM14h, XMM14i, XMM14j, XMM14k, XMM14l, XMM14m, XMM14n, XMM14o, XMM14p,
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1093
                      XMM15, XMM15b, XMM15c, XMM15d, XMM15e, XMM15f, XMM15g, XMM15h, XMM15i, XMM15j, XMM15k, XMM15l, XMM15m, XMM15n, XMM15o, XMM15p
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1094
#endif
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1095
                      );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1096
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1097
reg_class_dynamic vectorz_reg(vectorz_reg_evex, vectorz_reg_legacy, %{ VM_Version::supports_evex() %} );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1098
reg_class_dynamic vectorz_reg_vl(vectorz_reg_evex, vectorz_reg_legacy, %{ VM_Version::supports_evex() && VM_Version::supports_avx512vl() %} );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1099
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1100
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1101
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1102
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1103
//----------SOURCE BLOCK-------------------------------------------------------
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1104
// This is a block of C++ code which provides values, functions, and
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1105
// definitions necessary in the rest of the architecture description
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1106
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1107
source_hpp %{
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1108
// Header information of the source block.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1109
// Method declarations/definitions which are used outside
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1110
// the ad-scope can conveniently be defined here.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1111
//
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1112
// To keep related declarations/definitions/uses close together,
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1113
// we switch between source %{ }% and source_hpp %{ }% freely as needed.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1114
25715
d5a8dbdc5150 8049325: Introduce and clean up umbrella headers for the files in the cpu subdirectories.
goetz
parents: 23498
diff changeset
  1115
class NativeJump;
d5a8dbdc5150 8049325: Introduce and clean up umbrella headers for the files in the cpu subdirectories.
goetz
parents: 23498
diff changeset
  1116
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1117
class CallStubImpl {
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1118
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1119
  //--------------------------------------------------------------
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1120
  //---<  Used for optimization in Compile::shorten_branches  >---
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1121
  //--------------------------------------------------------------
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1122
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1123
 public:
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1124
  // Size of call trampoline stub.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1125
  static uint size_call_trampoline() {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1126
    return 0; // no call trampolines on this platform
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1127
  }
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1128
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1129
  // number of relocations needed by a call trampoline stub
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1130
  static uint reloc_call_trampoline() {
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1131
    return 0; // no call trampolines on this platform
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1132
  }
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1133
};
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1134
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1135
class HandlerImpl {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1136
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1137
 public:
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1138
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1139
  static int emit_exception_handler(CodeBuffer &cbuf);
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1140
  static int emit_deopt_handler(CodeBuffer& cbuf);
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1141
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1142
  static uint size_exception_handler() {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1143
    // NativeCall instruction size is the same as NativeJump.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1144
    // exception handler starts out as jump and can be patched to
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1145
    // a call be deoptimization.  (4932387)
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1146
    // Note that this value is also credited (in output.cpp) to
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1147
    // the size of the code section.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1148
    return NativeJump::instruction_size;
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1149
  }
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1150
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1151
#ifdef _LP64
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1152
  static uint size_deopt_handler() {
51633
21154cb84d2a 8209594: guarantee(this->is8bit(imm8)) failed: Short forward jump exceeds 8-bit offset
kvn
parents: 51078
diff changeset
  1153
    // three 5 byte instructions plus one move for unreachable address.
21154cb84d2a 8209594: guarantee(this->is8bit(imm8)) failed: Short forward jump exceeds 8-bit offset
kvn
parents: 51078
diff changeset
  1154
    return 15+3;
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1155
  }
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1156
#else
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1157
  static uint size_deopt_handler() {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1158
    // NativeCall instruction size is the same as NativeJump.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1159
    // exception handler starts out as jump and can be patched to
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1160
    // a call be deoptimization.  (4932387)
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1161
    // Note that this value is also credited (in output.cpp) to
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1162
    // the size of the code section.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1163
    return 5 + NativeJump::instruction_size; // pushl(); jmp;
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1164
  }
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1165
#endif
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1166
};
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1167
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1168
%} // end source_hpp
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1169
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1170
source %{
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1171
38286
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1172
#include "opto/addnode.hpp"
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1173
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1174
// Emit exception handler code.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1175
// Stuff framesize into a register and call a VM stub routine.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1176
int HandlerImpl::emit_exception_handler(CodeBuffer& cbuf) {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1177
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1178
  // Note that the code buffer's insts_mark is always relative to insts.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1179
  // That's why we must use the macroassembler to generate a handler.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1180
  MacroAssembler _masm(&cbuf);
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1181
  address base = __ start_a_stub(size_exception_handler());
32082
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1182
  if (base == NULL) {
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1183
    ciEnv::current()->record_failure("CodeCache is full");
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1184
    return 0;  // CodeBuffer::expand failed
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1185
  }
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1186
  int offset = __ offset();
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1187
  __ jump(RuntimeAddress(OptoRuntime::exception_blob()->entry_point()));
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1188
  assert(__ offset() - offset <= (int) size_exception_handler(), "overflow");
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1189
  __ end_a_stub();
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1190
  return offset;
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1191
}
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1192
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1193
// Emit deopt handler code.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1194
int HandlerImpl::emit_deopt_handler(CodeBuffer& cbuf) {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1195
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1196
  // Note that the code buffer's insts_mark is always relative to insts.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1197
  // That's why we must use the macroassembler to generate a handler.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1198
  MacroAssembler _masm(&cbuf);
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1199
  address base = __ start_a_stub(size_deopt_handler());
32082
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1200
  if (base == NULL) {
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1201
    ciEnv::current()->record_failure("CodeCache is full");
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1202
    return 0;  // CodeBuffer::expand failed
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1203
  }
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1204
  int offset = __ offset();
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1205
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1206
#ifdef _LP64
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1207
  address the_pc = (address) __ pc();
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1208
  Label next;
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1209
  // push a "the_pc" on the stack without destroying any registers
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1210
  // as they all may be live.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1211
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1212
  // push address of "next"
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1213
  __ call(next, relocInfo::none); // reloc none is fine since it is a disp32
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1214
  __ bind(next);
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1215
  // adjust it so it matches "the_pc"
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1216
  __ subptr(Address(rsp, 0), __ offset() - offset);
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1217
#else
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1218
  InternalAddress here(__ pc());
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1219
  __ pushptr(here.addr());
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1220
#endif
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1221
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1222
  __ jump(RuntimeAddress(SharedRuntime::deopt_blob()->unpack()));
51633
21154cb84d2a 8209594: guarantee(this->is8bit(imm8)) failed: Short forward jump exceeds 8-bit offset
kvn
parents: 51078
diff changeset
  1223
  assert(__ offset() - offset <= (int) size_deopt_handler(), "overflow %d", (__ offset() - offset));
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1224
  __ end_a_stub();
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1225
  return offset;
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1226
}
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1227
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1228
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1229
//=============================================================================
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1230
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1231
  // Float masks come from different places depending on platform.
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1232
#ifdef _LP64
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1233
  static address float_signmask()  { return StubRoutines::x86::float_sign_mask(); }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1234
  static address float_signflip()  { return StubRoutines::x86::float_sign_flip(); }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1235
  static address double_signmask() { return StubRoutines::x86::double_sign_mask(); }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1236
  static address double_signflip() { return StubRoutines::x86::double_sign_flip(); }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1237
#else
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1238
  static address float_signmask()  { return (address)float_signmask_pool; }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1239
  static address float_signflip()  { return (address)float_signflip_pool; }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1240
  static address double_signmask() { return (address)double_signmask_pool; }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1241
  static address double_signflip() { return (address)double_signflip_pool; }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1242
#endif
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1243
  static address vector_short_to_byte_mask() { return StubRoutines::x86::vector_short_to_byte_mask(); }
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1244
  static address vector_byte_perm_mask() { return StubRoutines::x86::vector_byte_perm_mask(); }
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1245
  static address vector_long_sign_mask() { return StubRoutines::x86::vector_long_sign_mask(); }
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1246
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1247
//=============================================================================
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1248
const bool Matcher::match_rule_supported(int opcode) {
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1249
  if (!has_match_rule(opcode))
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1250
    return false;
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1251
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1252
  bool ret_value = true;
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1253
  switch (opcode) {
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1254
    case Op_AbsVL:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1255
      if (UseAVX < 3)
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1256
        ret_value = false;
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1257
    case Op_PopCountI:
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1258
    case Op_PopCountL:
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1259
      if (!UsePopCountInstruction)
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1260
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1261
      break;
49384
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  1262
    case Op_PopCountVI:
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  1263
      if (!UsePopCountInstruction || !VM_Version::supports_vpopcntdq())
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  1264
        ret_value = false;
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  1265
      break;
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1266
    case Op_MulVI:
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1267
      if ((UseSSE < 4) && (UseAVX < 1)) // only with SSE4_1 or AVX
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1268
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1269
      break;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1270
    case Op_MulVL:
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1271
    case Op_MulReductionVL:
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1272
      if (VM_Version::supports_avx512dq() == false)
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1273
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1274
      break;
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1275
    case Op_AddReductionVL:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1276
      if (UseAVX < 3) // only EVEX : vector connectivity becomes an issue here
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1277
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1278
      break;
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1279
    case Op_AbsVB:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1280
    case Op_AbsVS:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1281
    case Op_AbsVI:
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1282
    case Op_AddReductionVI:
58643
b381e5328461 8232106: [x86] C2: SIGILL due to usage of SSSE3 instructions on processors which don't support it
mdoerr
parents: 58516
diff changeset
  1283
      if (UseSSE < 3 || !VM_Version::supports_ssse3()) // requires at least SSSE3
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1284
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1285
      break;
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1286
    case Op_MulReductionVI:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1287
      if (UseSSE < 4) // requires at least SSE4
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1288
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1289
      break;
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1290
    case Op_AddReductionVF:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1291
    case Op_AddReductionVD:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1292
    case Op_MulReductionVF:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1293
    case Op_MulReductionVD:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1294
      if (UseSSE < 1) // requires at least SSE
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1295
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1296
      break;
32723
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  1297
    case Op_SqrtVD:
48089
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  1298
    case Op_SqrtVF:
32723
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  1299
      if (UseAVX < 1) // enabled for AVX only
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1300
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1301
      break;
13886
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13883
diff changeset
  1302
    case Op_CompareAndSwapL:
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13883
diff changeset
  1303
#ifdef _LP64
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13883
diff changeset
  1304
    case Op_CompareAndSwapP:
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13883
diff changeset
  1305
#endif
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13883
diff changeset
  1306
      if (!VM_Version::supports_cx8())
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1307
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1308
      break;
48309
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  1309
    case Op_CMoveVF:
33469
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1310
    case Op_CMoveVD:
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1311
      if (UseAVX < 1 || UseAVX > 2)
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1312
        ret_value = false;
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1313
      break;
35581
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1314
    case Op_StrIndexOf:
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1315
      if (!UseSSE42Intrinsics)
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1316
        ret_value = false;
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1317
      break;
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1318
    case Op_StrIndexOfChar:
39253
bd5fe208734e 8157842: indexOfChar intrinsic is not emitted on x86
thartmann
parents: 38286
diff changeset
  1319
      if (!UseSSE42Intrinsics)
35581
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1320
        ret_value = false;
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1321
      break;
38017
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  1322
    case Op_OnSpinWait:
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  1323
      if (VM_Version::supports_on_spin_wait() == false)
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  1324
        ret_value = false;
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  1325
      break;
52992
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  1326
    case Op_MulAddVS2VI:
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1327
    case Op_RShiftVL:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1328
    case Op_AbsVD:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1329
    case Op_NegVD:
52992
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  1330
      if (UseSSE < 2)
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  1331
        ret_value = false;
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  1332
      break;
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1333
    case Op_MulVB:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1334
    case Op_LShiftVB:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1335
    case Op_RShiftVB:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1336
    case Op_URShiftVB:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1337
      if (UseSSE < 4)
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1338
        ret_value = false;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1339
      break;
54022
ff399127078a 8217561: X86: Add floating-point Math.min/max intrinsics
bsrbnd
parents: 53639
diff changeset
  1340
#ifdef _LP64
ff399127078a 8217561: X86: Add floating-point Math.min/max intrinsics
bsrbnd
parents: 53639
diff changeset
  1341
    case Op_MaxD:
ff399127078a 8217561: X86: Add floating-point Math.min/max intrinsics
bsrbnd
parents: 53639
diff changeset
  1342
    case Op_MaxF:
ff399127078a 8217561: X86: Add floating-point Math.min/max intrinsics
bsrbnd
parents: 53639
diff changeset
  1343
    case Op_MinD:
ff399127078a 8217561: X86: Add floating-point Math.min/max intrinsics
bsrbnd
parents: 53639
diff changeset
  1344
    case Op_MinF:
ff399127078a 8217561: X86: Add floating-point Math.min/max intrinsics
bsrbnd
parents: 53639
diff changeset
  1345
      if (UseAVX < 1) // enabled for AVX only
ff399127078a 8217561: X86: Add floating-point Math.min/max intrinsics
bsrbnd
parents: 53639
diff changeset
  1346
        ret_value = false;
ff399127078a 8217561: X86: Add floating-point Math.min/max intrinsics
bsrbnd
parents: 53639
diff changeset
  1347
      break;
ff399127078a 8217561: X86: Add floating-point Math.min/max intrinsics
bsrbnd
parents: 53639
diff changeset
  1348
#endif
57804
9b7b9f16dfd9 8224974: Implement JEP 352
adinn
parents: 55299
diff changeset
  1349
    case Op_CacheWB:
9b7b9f16dfd9 8224974: Implement JEP 352
adinn
parents: 55299
diff changeset
  1350
    case Op_CacheWBPreSync:
9b7b9f16dfd9 8224974: Implement JEP 352
adinn
parents: 55299
diff changeset
  1351
    case Op_CacheWBPostSync:
9b7b9f16dfd9 8224974: Implement JEP 352
adinn
parents: 55299
diff changeset
  1352
      if (!VM_Version::supports_data_cache_line_flush()) {
9b7b9f16dfd9 8224974: Implement JEP 352
adinn
parents: 55299
diff changeset
  1353
        ret_value = false;
9b7b9f16dfd9 8224974: Implement JEP 352
adinn
parents: 55299
diff changeset
  1354
      }
9b7b9f16dfd9 8224974: Implement JEP 352
adinn
parents: 55299
diff changeset
  1355
      break;
58421
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  1356
    case Op_RoundDoubleMode:
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  1357
      if (UseSSE < 4)
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  1358
         ret_value = false;
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  1359
      break;
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1360
  }
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1361
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1362
  return ret_value;  // Per default match rules are supported.
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1363
}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1364
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1365
const bool Matcher::match_rule_supported_vector(int opcode, int vlen) {
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1366
  // identify extra cases that we might want to provide match rules for
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1367
  // e.g. Op_ vector nodes and other intrinsics while guarding with vlen
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1368
  bool ret_value = match_rule_supported(opcode);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1369
  if (ret_value) {
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1370
    switch (opcode) {
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1371
      case Op_AbsVB:
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1372
      case Op_AddVB:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1373
      case Op_SubVB:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1374
        if ((vlen == 64) && (VM_Version::supports_avx512bw() == false))
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1375
          ret_value = false;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1376
        break;
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1377
      case Op_AbsVS:
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1378
      case Op_AddVS:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1379
      case Op_SubVS:
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1380
      case Op_MulVS:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1381
      case Op_LShiftVS:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1382
      case Op_RShiftVS:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1383
      case Op_URShiftVS:
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1384
        if ((vlen == 32) && (VM_Version::supports_avx512bw() == false))
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1385
          ret_value = false;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1386
        break;
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1387
      case Op_MulVB:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1388
      case Op_LShiftVB:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1389
      case Op_RShiftVB:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1390
      case Op_URShiftVB:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1391
        if ((vlen == 32 && UseAVX < 2) || 
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1392
            ((vlen == 64) && (VM_Version::supports_avx512bw() == false)))
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1393
          ret_value = false;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1394
        break;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1395
      case Op_NegVF:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1396
        if ((vlen == 16) && (VM_Version::supports_avx512dq() == false))
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1397
          ret_value = false;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1398
        break;
48309
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  1399
      case Op_CMoveVF:
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  1400
        if (vlen != 8)
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  1401
          ret_value  = false;
51078
fc6cfe40e32a 8207049: Minor improvements of compiler code.
goetz
parents: 50525
diff changeset
  1402
        break;
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1403
      case Op_NegVD:
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1404
        if ((vlen == 8) && (VM_Version::supports_avx512dq() == false))
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1405
          ret_value = false;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  1406
        break;
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1407
      case Op_CMoveVD:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1408
        if (vlen != 4)
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1409
          ret_value  = false;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1410
        break;
58421
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  1411
      case Op_RoundDoubleModeV:
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  1412
        if (VM_Version::supports_avx() == false)
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  1413
          ret_value = false;
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  1414
        break;
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1415
    }
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1416
  }
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1417
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1418
  return ret_value;  // Per default match rules are supported.
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1419
}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1420
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1421
const bool Matcher::has_predicated_vectors(void) {
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1422
  bool ret_value = false;
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1423
  if (UseAVX > 2) {
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1424
    ret_value = VM_Version::supports_avx512vl();
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1425
  }
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1426
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1427
  return ret_value;
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1428
}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1429
33065
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1430
const int Matcher::float_pressure(int default_pressure_threshold) {
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1431
  int float_pressure_threshold = default_pressure_threshold;
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1432
#ifdef _LP64
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1433
  if (UseAVX > 2) {
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1434
    // Increase pressure threshold on machines with AVX3 which have
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1435
    // 2x more XMM registers.
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1436
    float_pressure_threshold = default_pressure_threshold * 2;
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1437
  }
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1438
#endif
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1439
  return float_pressure_threshold;
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1440
}
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1441
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1442
// Max vector size in bytes. 0 if not supported.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1443
const int Matcher::vector_width_in_bytes(BasicType bt) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1444
  assert(is_java_primitive(bt), "only primitive type vectors");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1445
  if (UseSSE < 2) return 0;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1446
  // SSE2 supports 128bit vectors for all types.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1447
  // AVX2 supports 256bit vectors for all types.
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1448
  // AVX2/EVEX supports 512bit vectors for all types.
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1449
  int size = (UseAVX > 1) ? (1 << UseAVX) * 8 : 16;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1450
  // AVX1 supports 256bit vectors only for FLOAT and DOUBLE.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1451
  if (UseAVX > 0 && (bt == T_FLOAT || bt == T_DOUBLE))
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1452
    size = (UseAVX > 2) ? 64 : 32;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1453
  if (UseAVX > 2 && (bt == T_BYTE || bt == T_SHORT || bt == T_CHAR))
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1454
    size = (VM_Version::supports_avx512bw()) ? 64 : 32;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1455
  // Use flag to limit vector size.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1456
  size = MIN2(size,(int)MaxVectorSize);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1457
  // Minimum 2 values in vector (or 4 for bytes).
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1458
  switch (bt) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1459
  case T_DOUBLE:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1460
  case T_LONG:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1461
    if (size < 16) return 0;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1462
    break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1463
  case T_FLOAT:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1464
  case T_INT:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1465
    if (size < 8) return 0;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1466
    break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1467
  case T_BOOLEAN:
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1468
    if (size < 4) return 0;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1469
    break;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1470
  case T_CHAR:
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1471
    if (size < 4) return 0;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1472
    break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1473
  case T_BYTE:
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1474
    if (size < 4) return 0;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1475
    break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1476
  case T_SHORT:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1477
    if (size < 4) return 0;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1478
    break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1479
  default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1480
    ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1481
  }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1482
  return size;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1483
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1484
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1485
// Limits on vector size (number of elements) loaded into vector.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1486
const int Matcher::max_vector_size(const BasicType bt) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1487
  return vector_width_in_bytes(bt)/type2aelembytes(bt);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1488
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1489
const int Matcher::min_vector_size(const BasicType bt) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1490
  int max_size = max_vector_size(bt);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1491
  // Min size which can be loaded into vector is 4 bytes.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1492
  int size = (type2aelembytes(bt) == 1) ? 4 : 2;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1493
  return MIN2(size,max_size);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1494
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1495
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1496
// Vector ideal reg corresponding to specified size in bytes
46378
4ccca1fdf627 8160748: Inconsistent types for ideal_reg
kbarrett
parents: 42039
diff changeset
  1497
const uint Matcher::vector_ideal_reg(int size) {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1498
  assert(MaxVectorSize >= size, "");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1499
  switch(size) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1500
    case  4: return Op_VecS;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1501
    case  8: return Op_VecD;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1502
    case 16: return Op_VecX;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1503
    case 32: return Op_VecY;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1504
    case 64: return Op_VecZ;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1505
  }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1506
  ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1507
  return 0;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1508
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1509
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  1510
// Only lowest bits of xmm reg are used for vector shift count.
46378
4ccca1fdf627 8160748: Inconsistent types for ideal_reg
kbarrett
parents: 42039
diff changeset
  1511
const uint Matcher::vector_shift_count_ideal_reg(int size) {
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  1512
  return Op_VecS;
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  1513
}
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  1514
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1515
// x86 supports misaligned vectors store/load.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1516
const bool Matcher::misaligned_vectors_ok() {
53639
da7dc9e92d91 8215483: Off heap memory accesses should be vectorized
roland
parents: 53580
diff changeset
  1517
  return true;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1518
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1519
22505
4523090c9674 8002074: Support for AES on SPARC
kvn
parents: 14131
diff changeset
  1520
// x86 AES instructions are compatible with SunJCE expanded
4523090c9674 8002074: Support for AES on SPARC
kvn
parents: 14131
diff changeset
  1521
// keys, hence we do not need to pass the original key to stubs
4523090c9674 8002074: Support for AES on SPARC
kvn
parents: 14131
diff changeset
  1522
const bool Matcher::pass_original_key_for_aes() {
4523090c9674 8002074: Support for AES on SPARC
kvn
parents: 14131
diff changeset
  1523
  return false;
4523090c9674 8002074: Support for AES on SPARC
kvn
parents: 14131
diff changeset
  1524
}
4523090c9674 8002074: Support for AES on SPARC
kvn
parents: 14131
diff changeset
  1525
38286
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1526
38236
510f77046e00 8154943: AArch64: redundant address computation instructions with vectorization
roland
parents: 38049
diff changeset
  1527
const bool Matcher::convi2l_type_required = true;
510f77046e00 8154943: AArch64: redundant address computation instructions with vectorization
roland
parents: 38049
diff changeset
  1528
38286
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1529
// Check for shift by small constant as well
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1530
static bool clone_shift(Node* shift, Matcher* matcher, Matcher::MStack& mstack, VectorSet& address_visited) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1531
  if (shift->Opcode() == Op_LShiftX && shift->in(2)->is_Con() &&
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1532
      shift->in(2)->get_int() <= 3 &&
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1533
      // Are there other uses besides address expressions?
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1534
      !matcher->is_visited(shift)) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1535
    address_visited.set(shift->_idx); // Flag as address_visited
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1536
    mstack.push(shift->in(2), Matcher::Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1537
    Node *conv = shift->in(1);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1538
#ifdef _LP64
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1539
    // Allow Matcher to match the rule which bypass
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1540
    // ConvI2L operation for an array index on LP64
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1541
    // if the index value is positive.
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1542
    if (conv->Opcode() == Op_ConvI2L &&
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1543
        conv->as_Type()->type()->is_long()->_lo >= 0 &&
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1544
        // Are there other uses besides address expressions?
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1545
        !matcher->is_visited(conv)) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1546
      address_visited.set(conv->_idx); // Flag as address_visited
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1547
      mstack.push(conv->in(1), Matcher::Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1548
    } else
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1549
#endif
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1550
      mstack.push(conv, Matcher::Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1551
    return true;
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1552
  }
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1553
  return false;
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1554
}
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1555
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1556
// Should the Matcher clone shifts on addressing modes, expecting them
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1557
// to be subsumed into complex addressing expressions or compute them
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1558
// into registers?
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1559
bool Matcher::clone_address_expressions(AddPNode* m, Matcher::MStack& mstack, VectorSet& address_visited) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1560
  Node *off = m->in(AddPNode::Offset);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1561
  if (off->is_Con()) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1562
    address_visited.test_set(m->_idx); // Flag as address_visited
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1563
    Node *adr = m->in(AddPNode::Address);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1564
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1565
    // Intel can handle 2 adds in addressing mode
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1566
    // AtomicAdd is not an addressing expression.
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1567
    // Cheap to find it by looking for screwy base.
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1568
    if (adr->is_AddP() &&
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1569
        !adr->in(AddPNode::Base)->is_top() &&
53436
80b55cf3a804 8202952: C2: Unexpected dead nodes after matching
vlivanov
parents: 53336
diff changeset
  1570
        LP64_ONLY( off->get_long() == (int) (off->get_long()) && ) // immL32
38286
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1571
        // Are there other uses besides address expressions?
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1572
        !is_visited(adr)) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1573
      address_visited.set(adr->_idx); // Flag as address_visited
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1574
      Node *shift = adr->in(AddPNode::Offset);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1575
      if (!clone_shift(shift, this, mstack, address_visited)) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1576
        mstack.push(shift, Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1577
      }
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1578
      mstack.push(adr->in(AddPNode::Address), Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1579
      mstack.push(adr->in(AddPNode::Base), Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1580
    } else {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1581
      mstack.push(adr, Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1582
    }
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1583
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1584
    // Clone X+offset as it also folds into most addressing expressions
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1585
    mstack.push(off, Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1586
    mstack.push(m->in(AddPNode::Base), Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1587
    return true;
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1588
  } else if (clone_shift(off, this, mstack, address_visited)) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1589
    address_visited.test_set(m->_idx); // Flag as address_visited
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1590
    mstack.push(m->in(AddPNode::Address), Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1591
    mstack.push(m->in(AddPNode::Base), Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1592
    return true;
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1593
  }
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1594
  return false;
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1595
}
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1596
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1597
void Compile::reshape_address(AddPNode* addp) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1598
}
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1599
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1600
// Helper methods for MachSpillCopyNode::implementation().
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1601
static int vec_mov_helper(CodeBuffer *cbuf, bool do_size, int src_lo, int dst_lo,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1602
                          int src_hi, int dst_hi, uint ireg, outputStream* st) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1603
  // In 64-bit VM size calculation is very complex. Emitting instructions
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1604
  // into scratch buffer is used to get size in 64-bit VM.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1605
  LP64_ONLY( assert(!do_size, "this method calculates size only for 32-bit VM"); )
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1606
  assert(ireg == Op_VecS || // 32bit vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1607
         (src_lo & 1) == 0 && (src_lo + 1) == src_hi &&
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1608
         (dst_lo & 1) == 0 && (dst_lo + 1) == dst_hi,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1609
         "no non-adjacent vector moves" );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1610
  if (cbuf) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1611
    MacroAssembler _masm(cbuf);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1612
    int offset = __ offset();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1613
    switch (ireg) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1614
    case Op_VecS: // copy whole register
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1615
    case Op_VecD:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1616
    case Op_VecX:
53580
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1617
#ifndef _LP64
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1618
      __ movdqu(as_XMMRegister(Matcher::_regEncode[dst_lo]), as_XMMRegister(Matcher::_regEncode[src_lo]));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1619
#else
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1620
      if ((UseAVX < 3) || VM_Version::supports_avx512vl()) {
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1621
        __ movdqu(as_XMMRegister(Matcher::_regEncode[dst_lo]), as_XMMRegister(Matcher::_regEncode[src_lo]));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1622
      } else {
53580
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1623
        __ vextractf32x4(as_XMMRegister(Matcher::_regEncode[dst_lo]), as_XMMRegister(Matcher::_regEncode[src_lo]), 0x0);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1624
     }
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1625
#endif
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1626
      break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1627
    case Op_VecY:
53580
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1628
#ifndef _LP64
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1629
      __ vmovdqu(as_XMMRegister(Matcher::_regEncode[dst_lo]), as_XMMRegister(Matcher::_regEncode[src_lo]));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1630
#else
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1631
      if ((UseAVX < 3) || VM_Version::supports_avx512vl()) {
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1632
        __ vmovdqu(as_XMMRegister(Matcher::_regEncode[dst_lo]), as_XMMRegister(Matcher::_regEncode[src_lo]));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1633
      } else {
53580
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1634
        __ vextractf64x4(as_XMMRegister(Matcher::_regEncode[dst_lo]), as_XMMRegister(Matcher::_regEncode[src_lo]), 0x0);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1635
     }
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1636
#endif
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1637
      break;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1638
    case Op_VecZ:
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1639
      __ evmovdquq(as_XMMRegister(Matcher::_regEncode[dst_lo]), as_XMMRegister(Matcher::_regEncode[src_lo]), 2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1640
      break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1641
    default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1642
      ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1643
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1644
    int size = __ offset() - offset;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1645
#ifdef ASSERT
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1646
    // VEX_2bytes prefix is used if UseAVX > 0, so it takes the same 2 bytes as SIMD prefix.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1647
    assert(!do_size || size == 4, "incorrect size calculattion");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1648
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1649
    return size;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1650
#ifndef PRODUCT
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1651
  } else if (!do_size) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1652
    switch (ireg) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1653
    case Op_VecS:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1654
    case Op_VecD:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1655
    case Op_VecX:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1656
      st->print("movdqu  %s,%s\t# spill",Matcher::regName[dst_lo],Matcher::regName[src_lo]);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1657
      break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1658
    case Op_VecY:
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1659
    case Op_VecZ:
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1660
      st->print("vmovdqu %s,%s\t# spill",Matcher::regName[dst_lo],Matcher::regName[src_lo]);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1661
      break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1662
    default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1663
      ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1664
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1665
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1666
  }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1667
  // VEX_2bytes prefix is used if UseAVX > 0, and it takes the same 2 bytes as SIMD prefix.
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1668
  return (UseAVX > 2) ? 6 : 4;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1669
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1670
58516
d376d86b0a01 8230565: ZGC: Redesign C2 load barrier to expand on the MachNode level
eosterlund
parents: 58462
diff changeset
  1671
int vec_spill_helper(CodeBuffer *cbuf, bool do_size, bool is_load,
d376d86b0a01 8230565: ZGC: Redesign C2 load barrier to expand on the MachNode level
eosterlund
parents: 58462
diff changeset
  1672
                     int stack_offset, int reg, uint ireg, outputStream* st) {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1673
  // In 64-bit VM size calculation is very complex. Emitting instructions
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1674
  // into scratch buffer is used to get size in 64-bit VM.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1675
  LP64_ONLY( assert(!do_size, "this method calculates size only for 32-bit VM"); )
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1676
  if (cbuf) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1677
    MacroAssembler _masm(cbuf);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1678
    int offset = __ offset();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1679
    if (is_load) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1680
      switch (ireg) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1681
      case Op_VecS:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1682
        __ movdl(as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1683
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1684
      case Op_VecD:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1685
        __ movq(as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1686
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1687
      case Op_VecX:
53580
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1688
#ifndef _LP64
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1689
        __ movdqu(as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1690
#else
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1691
        if ((UseAVX < 3) || VM_Version::supports_avx512vl()) {
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1692
          __ movdqu(as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1693
        } else {
53580
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1694
          __ vpxor(as_XMMRegister(Matcher::_regEncode[reg]), as_XMMRegister(Matcher::_regEncode[reg]), as_XMMRegister(Matcher::_regEncode[reg]), 2);
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1695
          __ vinsertf32x4(as_XMMRegister(Matcher::_regEncode[reg]), as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset),0x0);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1696
        }
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1697
#endif
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1698
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1699
      case Op_VecY:
53580
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1700
#ifndef _LP64
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1701
        __ vmovdqu(as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1702
#else
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1703
        if ((UseAVX < 3) || VM_Version::supports_avx512vl()) {
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1704
          __ vmovdqu(as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1705
        } else {
53580
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1706
          __ vpxor(as_XMMRegister(Matcher::_regEncode[reg]), as_XMMRegister(Matcher::_regEncode[reg]), as_XMMRegister(Matcher::_regEncode[reg]), 2);
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1707
          __ vinsertf64x4(as_XMMRegister(Matcher::_regEncode[reg]), as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset),0x0);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1708
        }
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1709
#endif
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1710
        break;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1711
      case Op_VecZ:
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1712
        __ evmovdquq(as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset), 2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1713
        break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1714
      default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1715
        ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1716
      }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1717
    } else { // store
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1718
      switch (ireg) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1719
      case Op_VecS:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1720
        __ movdl(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1721
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1722
      case Op_VecD:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1723
        __ movq(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1724
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1725
      case Op_VecX:
53580
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1726
#ifndef _LP64
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1727
        __ movdqu(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1728
#else
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1729
        if ((UseAVX < 3) || VM_Version::supports_avx512vl()) {
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1730
          __ movdqu(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1731
        }
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1732
        else {
53580
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1733
          __ vextractf32x4(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]), 0x0);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1734
        }
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1735
#endif
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1736
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1737
      case Op_VecY:
53580
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1738
#ifndef _LP64
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1739
        __ vmovdqu(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1740
#else
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1741
        if ((UseAVX < 3) || VM_Version::supports_avx512vl()) {
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1742
          __ vmovdqu(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1743
        }
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1744
        else {
53580
6121eee15c23 8217371: Incorrect LP64 guard in x86.ad after JDK-8210764 (Update avx512 implementation)
sviswanathan
parents: 53436
diff changeset
  1745
          __ vextractf64x4(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]), 0x0);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1746
        }
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1747
#endif
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1748
        break;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1749
      case Op_VecZ:
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1750
        __ evmovdquq(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]), 2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1751
        break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1752
      default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1753
        ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1754
      }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1755
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1756
    int size = __ offset() - offset;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1757
#ifdef ASSERT
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1758
    int offset_size = (stack_offset == 0) ? 0 : ((stack_offset < 0x80) ? 1 : (UseAVX > 2) ? 6 : 4);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1759
    // VEX_2bytes prefix is used if UseAVX > 0, so it takes the same 2 bytes as SIMD prefix.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1760
    assert(!do_size || size == (5+offset_size), "incorrect size calculattion");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1761
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1762
    return size;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1763
#ifndef PRODUCT
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1764
  } else if (!do_size) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1765
    if (is_load) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1766
      switch (ireg) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1767
      case Op_VecS:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1768
        st->print("movd    %s,[rsp + %d]\t# spill", Matcher::regName[reg], stack_offset);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1769
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1770
      case Op_VecD:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1771
        st->print("movq    %s,[rsp + %d]\t# spill", Matcher::regName[reg], stack_offset);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1772
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1773
       case Op_VecX:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1774
        st->print("movdqu  %s,[rsp + %d]\t# spill", Matcher::regName[reg], stack_offset);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1775
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1776
      case Op_VecY:
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1777
      case Op_VecZ:
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1778
        st->print("vmovdqu %s,[rsp + %d]\t# spill", Matcher::regName[reg], stack_offset);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1779
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1780
      default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1781
        ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1782
      }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1783
    } else { // store
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1784
      switch (ireg) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1785
      case Op_VecS:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1786
        st->print("movd    [rsp + %d],%s\t# spill", stack_offset, Matcher::regName[reg]);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1787
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1788
      case Op_VecD:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1789
        st->print("movq    [rsp + %d],%s\t# spill", stack_offset, Matcher::regName[reg]);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1790
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1791
       case Op_VecX:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1792
        st->print("movdqu  [rsp + %d],%s\t# spill", stack_offset, Matcher::regName[reg]);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1793
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1794
      case Op_VecY:
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1795
      case Op_VecZ:
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1796
        st->print("vmovdqu [rsp + %d],%s\t# spill", stack_offset, Matcher::regName[reg]);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1797
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1798
      default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1799
        ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1800
      }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1801
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1802
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1803
  }
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1804
  bool is_single_byte = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1805
  int vec_len = 0;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1806
  if ((UseAVX > 2) && (stack_offset != 0)) {
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1807
    int tuple_type = Assembler::EVEX_FVM;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1808
    int input_size = Assembler::EVEX_32bit;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1809
    switch (ireg) {
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1810
    case Op_VecS:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1811
      tuple_type = Assembler::EVEX_T1S;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1812
      break;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1813
    case Op_VecD:
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1814
      tuple_type = Assembler::EVEX_T1S;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1815
      input_size = Assembler::EVEX_64bit;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1816
      break;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1817
    case Op_VecX:
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1818
      break;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1819
    case Op_VecY:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1820
      vec_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1821
      break;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1822
    case Op_VecZ:
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1823
      vec_len = 2;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1824
      break;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1825
    }
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1826
    is_single_byte = Assembler::query_compressed_disp_byte(stack_offset, true, vec_len, tuple_type, input_size, 0);
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1827
  }
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1828
  int offset_size = 0;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1829
  int size = 5;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1830
  if (UseAVX > 2 ) {
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1831
    if (VM_Version::supports_avx512novl() && (vec_len == 2)) {
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1832
      offset_size = (stack_offset == 0) ? 0 : ((is_single_byte) ? 1 : 4);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1833
      size += 2; // Need an additional two bytes for EVEX encoding
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1834
    } else if (VM_Version::supports_avx512novl() && (vec_len < 2)) {
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1835
      offset_size = (stack_offset == 0) ? 0 : ((stack_offset <= 127) ? 1 : 4);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1836
    } else {
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1837
      offset_size = (stack_offset == 0) ? 0 : ((is_single_byte) ? 1 : 4);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1838
      size += 2; // Need an additional two bytes for EVEX encodding
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1839
    }
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1840
  } else {
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1841
    offset_size = (stack_offset == 0) ? 0 : ((stack_offset <= 127) ? 1 : 4);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1842
  }
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1843
  // VEX_2bytes prefix is used if UseAVX > 0, so it takes the same 2 bytes as SIMD prefix.
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1844
  return size+offset_size;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1845
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1846
40040
7644f470d923 8160425: Vectorization with signalling NaN returns wrong result
thartmann
parents: 39253
diff changeset
  1847
static inline jint replicate4_imm(int con, int width) {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1848
  // Load a constant of "width" (in bytes) and replicate it to fill 32bit.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1849
  assert(width == 1 || width == 2, "only byte or short types here");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1850
  int bit_width = width * 8;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1851
  jint val = con;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1852
  val &= (1 << bit_width) - 1;  // mask off sign bits
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1853
  while(bit_width < 32) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1854
    val |= (val << bit_width);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1855
    bit_width <<= 1;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1856
  }
40040
7644f470d923 8160425: Vectorization with signalling NaN returns wrong result
thartmann
parents: 39253
diff changeset
  1857
  return val;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1858
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1859
40040
7644f470d923 8160425: Vectorization with signalling NaN returns wrong result
thartmann
parents: 39253
diff changeset
  1860
static inline jlong replicate8_imm(int con, int width) {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1861
  // Load a constant of "width" (in bytes) and replicate it to fill 64bit.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1862
  assert(width == 1 || width == 2 || width == 4, "only byte, short or int types here");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1863
  int bit_width = width * 8;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1864
  jlong val = con;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1865
  val &= (((jlong) 1) << bit_width) - 1;  // mask off sign bits
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1866
  while(bit_width < 64) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1867
    val |= (val << bit_width);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1868
    bit_width <<= 1;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1869
  }
40040
7644f470d923 8160425: Vectorization with signalling NaN returns wrong result
thartmann
parents: 39253
diff changeset
  1870
  return val;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1871
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1872
11794
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1873
#ifndef PRODUCT
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1874
  void MachNopNode::format(PhaseRegAlloc*, outputStream* st) const {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1875
    st->print("nop \t# %d bytes pad for loops and calls", _count);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1876
  }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1877
#endif
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1878
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1879
  void MachNopNode::emit(CodeBuffer &cbuf, PhaseRegAlloc*) const {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1880
    MacroAssembler _masm(&cbuf);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1881
    __ nop(_count);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1882
  }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1883
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1884
  uint MachNopNode::size(PhaseRegAlloc*) const {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1885
    return _count;
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1886
  }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1887
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1888
#ifndef PRODUCT
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1889
  void MachBreakpointNode::format(PhaseRegAlloc*, outputStream* st) const {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1890
    st->print("# breakpoint");
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1891
  }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1892
#endif
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1893
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1894
  void MachBreakpointNode::emit(CodeBuffer &cbuf, PhaseRegAlloc* ra_) const {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1895
    MacroAssembler _masm(&cbuf);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1896
    __ int3();
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1897
  }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1898
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1899
  uint MachBreakpointNode::size(PhaseRegAlloc* ra_) const {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1900
    return MachNode::size(ra_);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1901
  }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1902
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1903
%}
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1904
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1905
encode %{
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1906
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1907
  enc_class call_epilog %{
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1908
    if (VerifyStackAtCalls) {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1909
      // Check that stack depth is unchanged: find majik cookie on stack
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1910
      int framesize = ra_->reg2offset_unchecked(OptoReg::add(ra_->_matcher._old_SP, -3*VMRegImpl::slots_per_word));
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1911
      MacroAssembler _masm(&cbuf);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1912
      Label L;
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1913
      __ cmpptr(Address(rsp, framesize), (int32_t)0xbadb100d);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1914
      __ jccb(Assembler::equal, L);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1915
      // Die if stack mismatch
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1916
      __ int3();
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1917
      __ bind(L);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1918
    }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1919
  %}
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1920
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1921
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1922
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1923
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1924
//----------OPERANDS-----------------------------------------------------------
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1925
// Operand definitions must precede instruction definitions for correct parsing
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1926
// in the ADLC because operands constitute user defined types which are used in
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1927
// instruction definitions.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1928
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1929
operand vecZ() %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1930
  constraint(ALLOC_IN_RC(vectorz_reg));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1931
  match(VecZ);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1932
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1933
  format %{ %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1934
  interface(REG_INTER);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1935
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1936
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1937
operand legVecZ() %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1938
  constraint(ALLOC_IN_RC(vectorz_reg_vl));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1939
  match(VecZ);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1940
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1941
  format %{ %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1942
  interface(REG_INTER);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1943
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  1944
33469
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1945
// Comparison Code for FP conditional move
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1946
operand cmpOp_vcmppd() %{
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1947
  match(Bool);
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1948
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1949
  predicate(n->as_Bool()->_test._test != BoolTest::overflow &&
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1950
            n->as_Bool()->_test._test != BoolTest::no_overflow);
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1951
  format %{ "" %}
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1952
  interface(COND_INTER) %{
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1953
    equal        (0x0, "eq");
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1954
    less         (0x1, "lt");
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1955
    less_equal   (0x2, "le");
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1956
    not_equal    (0xC, "ne");
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1957
    greater_equal(0xD, "ge");
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1958
    greater      (0xE, "gt");
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1959
    //TODO cannot compile (adlc breaks) without two next lines with error:
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1960
    // x86_64.ad(13987) Syntax Error: :In operand cmpOp_vcmppd: Do not support this encode constant: ' %{
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1961
    // equal' for overflow.
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1962
    overflow     (0x20, "o");  // not really supported by the instruction
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1963
    no_overflow  (0x21, "no"); // not really supported by the instruction
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1964
  %}
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1965
%}
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1966
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1967
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1968
// INSTRUCTIONS -- Platform independent definitions (same for 32- and 64-bit)
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1969
11794
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1970
// ============================================================================
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1971
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1972
instruct ShouldNotReachHere() %{
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1973
  match(Halt);
46525
3a5c833a43de 8176506: C2: loop unswitching and unsafe accesses cause crash
roland
parents: 46378
diff changeset
  1974
  format %{ "ud2\t# ShouldNotReachHere" %}
3a5c833a43de 8176506: C2: loop unswitching and unsafe accesses cause crash
roland
parents: 46378
diff changeset
  1975
  ins_encode %{
58061
fafba5cf3546 8225653: Provide more information when hitting SIGILL from HaltNode
chagedorn
parents: 57804
diff changeset
  1976
    __ stop(_halt_reason);
11794
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1977
  %}
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1978
  ins_pipe(pipe_slow);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1979
%}
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1980
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1981
// =================================EVEX special===============================
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1982
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1983
instruct setMask(rRegI dst, rRegI src) %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1984
  predicate(Matcher::has_predicated_vectors());
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1985
  match(Set dst (SetVectMaskI  src));
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1986
  effect(TEMP dst);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1987
  format %{ "setvectmask   $dst, $src" %}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1988
  ins_encode %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1989
    __ setvectmask($dst$$Register, $src$$Register);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1990
  %}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1991
  ins_pipe(pipe_slow);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1992
%}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1993
11794
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1994
// ============================================================================
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1995
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1996
instruct addF_reg(regF dst, regF src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1997
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1998
  match(Set dst (AddF dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1999
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2000
  format %{ "addss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2001
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2002
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2003
    __ addss($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2004
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2005
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2006
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2007
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2008
instruct addF_mem(regF dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2009
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2010
  match(Set dst (AddF dst (LoadF src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2011
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2012
  format %{ "addss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2013
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2014
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2015
    __ addss($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2016
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2017
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2018
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2019
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2020
instruct addF_imm(regF dst, immF con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2021
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2022
  match(Set dst (AddF dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2023
  format %{ "addss   $dst, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2024
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2025
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2026
    __ addss($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2027
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2028
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2029
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2030
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2031
instruct addF_reg_reg(regF dst, regF src1, regF src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2032
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2033
  match(Set dst (AddF src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2034
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2035
  format %{ "vaddss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2036
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2037
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2038
    __ vaddss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2039
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2040
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2041
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2042
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2043
instruct addF_reg_mem(regF dst, regF src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2044
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2045
  match(Set dst (AddF src1 (LoadF src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2046
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2047
  format %{ "vaddss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2048
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2049
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2050
    __ vaddss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2051
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2052
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2053
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2054
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2055
instruct addF_reg_imm(regF dst, regF src, immF con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2056
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2057
  match(Set dst (AddF src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2058
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2059
  format %{ "vaddss  $dst, $src, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2060
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2061
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2062
    __ vaddss($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2063
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2064
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2065
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2066
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2067
instruct addD_reg(regD dst, regD src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2068
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2069
  match(Set dst (AddD dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2070
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2071
  format %{ "addsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2072
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2073
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2074
    __ addsd($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2075
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2076
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2077
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2078
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2079
instruct addD_mem(regD dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2080
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2081
  match(Set dst (AddD dst (LoadD src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2082
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2083
  format %{ "addsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2084
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2085
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2086
    __ addsd($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2087
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2088
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2089
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2090
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2091
instruct addD_imm(regD dst, immD con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2092
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2093
  match(Set dst (AddD dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2094
  format %{ "addsd   $dst, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2095
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2096
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2097
    __ addsd($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2098
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2099
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2100
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2101
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2102
instruct addD_reg_reg(regD dst, regD src1, regD src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2103
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2104
  match(Set dst (AddD src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2105
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2106
  format %{ "vaddsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2107
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2108
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2109
    __ vaddsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2110
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2111
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2112
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2113
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2114
instruct addD_reg_mem(regD dst, regD src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2115
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2116
  match(Set dst (AddD src1 (LoadD src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2117
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2118
  format %{ "vaddsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2119
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2120
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2121
    __ vaddsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2122
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2123
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2124
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2125
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2126
instruct addD_reg_imm(regD dst, regD src, immD con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2127
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2128
  match(Set dst (AddD src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2129
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2130
  format %{ "vaddsd  $dst, $src, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2131
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2132
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2133
    __ vaddsd($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2134
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2135
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2136
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2137
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2138
instruct subF_reg(regF dst, regF src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2139
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2140
  match(Set dst (SubF dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2141
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2142
  format %{ "subss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2143
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2144
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2145
    __ subss($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2146
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2147
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2148
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2149
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2150
instruct subF_mem(regF dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2151
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2152
  match(Set dst (SubF dst (LoadF src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2153
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2154
  format %{ "subss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2155
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2156
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2157
    __ subss($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2158
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2159
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2160
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2161
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2162
instruct subF_imm(regF dst, immF con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2163
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2164
  match(Set dst (SubF dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2165
  format %{ "subss   $dst, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2166
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2167
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2168
    __ subss($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2169
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2170
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2171
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2172
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2173
instruct subF_reg_reg(regF dst, regF src1, regF src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2174
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2175
  match(Set dst (SubF src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2176
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2177
  format %{ "vsubss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2178
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2179
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2180
    __ vsubss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2181
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2182
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2183
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2184
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2185
instruct subF_reg_mem(regF dst, regF src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2186
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2187
  match(Set dst (SubF src1 (LoadF src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2188
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2189
  format %{ "vsubss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2190
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2191
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2192
    __ vsubss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2193
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2194
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2195
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2196
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2197
instruct subF_reg_imm(regF dst, regF src, immF con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2198
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2199
  match(Set dst (SubF src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2200
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2201
  format %{ "vsubss  $dst, $src, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2202
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2203
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2204
    __ vsubss($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2205
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2206
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2207
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2208
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2209
instruct subD_reg(regD dst, regD src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2210
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2211
  match(Set dst (SubD dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2212
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2213
  format %{ "subsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2214
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2215
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2216
    __ subsd($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2217
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2218
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2219
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2220
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2221
instruct subD_mem(regD dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2222
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2223
  match(Set dst (SubD dst (LoadD src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2224
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2225
  format %{ "subsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2226
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2227
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2228
    __ subsd($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2229
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2230
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2231
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2232
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2233
instruct subD_imm(regD dst, immD con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2234
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2235
  match(Set dst (SubD dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2236
  format %{ "subsd   $dst, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2237
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2238
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2239
    __ subsd($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2240
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2241
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2242
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2243
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2244
instruct subD_reg_reg(regD dst, regD src1, regD src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2245
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2246
  match(Set dst (SubD src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2247
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2248
  format %{ "vsubsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2249
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2250
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2251
    __ vsubsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2252
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2253
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2254
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2255
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2256
instruct subD_reg_mem(regD dst, regD src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2257
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2258
  match(Set dst (SubD src1 (LoadD src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2259
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2260
  format %{ "vsubsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2261
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2262
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2263
    __ vsubsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2264
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2265
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2266
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2267
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2268
instruct subD_reg_imm(regD dst, regD src, immD con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2269
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2270
  match(Set dst (SubD src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2271
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2272
  format %{ "vsubsd  $dst, $src, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2273
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2274
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2275
    __ vsubsd($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2276
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2277
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2278
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2279
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2280
instruct mulF_reg(regF dst, regF src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2281
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2282
  match(Set dst (MulF dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2283
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2284
  format %{ "mulss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2285
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2286
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2287
    __ mulss($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2288
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2289
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2290
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2291
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2292
instruct mulF_mem(regF dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2293
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2294
  match(Set dst (MulF dst (LoadF src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2295
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2296
  format %{ "mulss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2297
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2298
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2299
    __ mulss($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2300
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2301
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2302
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2303
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2304
instruct mulF_imm(regF dst, immF con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2305
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2306
  match(Set dst (MulF dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2307
  format %{ "mulss   $dst, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2308
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2309
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2310
    __ mulss($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2311
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2312
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2313
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2314
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2315
instruct mulF_reg_reg(regF dst, regF src1, regF src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2316
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2317
  match(Set dst (MulF src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2318
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2319
  format %{ "vmulss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2320
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2321
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2322
    __ vmulss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2323
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2324
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2325
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2326
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2327
instruct mulF_reg_mem(regF dst, regF src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2328
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2329
  match(Set dst (MulF src1 (LoadF src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2330
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2331
  format %{ "vmulss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2332
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2333
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2334
    __ vmulss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2335
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2336
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2337
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2338
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2339
instruct mulF_reg_imm(regF dst, regF src, immF con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2340
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2341
  match(Set dst (MulF src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2342
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2343
  format %{ "vmulss  $dst, $src, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2344
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2345
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2346
    __ vmulss($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2347
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2348
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2349
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2350
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2351
instruct mulD_reg(regD dst, regD src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2352
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2353
  match(Set dst (MulD dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2354
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2355
  format %{ "mulsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2356
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2357
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2358
    __ mulsd($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2359
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2360
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2361
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2362
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2363
instruct mulD_mem(regD dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2364
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2365
  match(Set dst (MulD dst (LoadD src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2366
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2367
  format %{ "mulsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2368
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2369
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2370
    __ mulsd($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2371
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2372
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2373
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2374
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2375
instruct mulD_imm(regD dst, immD con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2376
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2377
  match(Set dst (MulD dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2378
  format %{ "mulsd   $dst, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2379
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2380
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2381
    __ mulsd($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2382
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2383
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2384
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2385
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2386
instruct mulD_reg_reg(regD dst, regD src1, regD src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2387
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2388
  match(Set dst (MulD src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2389
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2390
  format %{ "vmulsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2391
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2392
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2393
    __ vmulsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2394
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2395
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2396
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2397
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2398
instruct mulD_reg_mem(regD dst, regD src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2399
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2400
  match(Set dst (MulD src1 (LoadD src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2401
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2402
  format %{ "vmulsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2403
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2404
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2405
    __ vmulsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2406
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2407
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2408
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2409
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2410
instruct mulD_reg_imm(regD dst, regD src, immD con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2411
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2412
  match(Set dst (MulD src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2413
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2414
  format %{ "vmulsd  $dst, $src, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2415
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2416
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2417
    __ vmulsd($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2418
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2419
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2420
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2421
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2422
instruct divF_reg(regF dst, regF src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2423
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2424
  match(Set dst (DivF dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2425
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2426
  format %{ "divss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2427
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2428
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2429
    __ divss($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2430
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2431
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2432
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2433
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2434
instruct divF_mem(regF dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2435
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2436
  match(Set dst (DivF dst (LoadF src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2437
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2438
  format %{ "divss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2439
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2440
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2441
    __ divss($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2442
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2443
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2444
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2445
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2446
instruct divF_imm(regF dst, immF con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2447
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2448
  match(Set dst (DivF dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2449
  format %{ "divss   $dst, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2450
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2451
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2452
    __ divss($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2453
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2454
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2455
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2456
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2457
instruct divF_reg_reg(regF dst, regF src1, regF src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2458
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2459
  match(Set dst (DivF src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2460
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2461
  format %{ "vdivss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2462
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2463
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2464
    __ vdivss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2465
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2466
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2467
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2468
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2469
instruct divF_reg_mem(regF dst, regF src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2470
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2471
  match(Set dst (DivF src1 (LoadF src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2472
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2473
  format %{ "vdivss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2474
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2475
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2476
    __ vdivss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2477
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2478
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2479
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2480
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2481
instruct divF_reg_imm(regF dst, regF src, immF con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2482
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2483
  match(Set dst (DivF src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2484
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2485
  format %{ "vdivss  $dst, $src, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2486
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2487
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2488
    __ vdivss($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2489
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2490
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2491
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2492
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2493
instruct divD_reg(regD dst, regD src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2494
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2495
  match(Set dst (DivD dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2496
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2497
  format %{ "divsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2498
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2499
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2500
    __ divsd($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2501
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2502
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2503
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2504
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2505
instruct divD_mem(regD dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2506
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2507
  match(Set dst (DivD dst (LoadD src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2508
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2509
  format %{ "divsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2510
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2511
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2512
    __ divsd($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2513
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2514
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2515
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2516
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2517
instruct divD_imm(regD dst, immD con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2518
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2519
  match(Set dst (DivD dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2520
  format %{ "divsd   $dst, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2521
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2522
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2523
    __ divsd($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2524
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2525
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2526
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2527
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2528
instruct divD_reg_reg(regD dst, regD src1, regD src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2529
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2530
  match(Set dst (DivD src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2531
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2532
  format %{ "vdivsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2533
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2534
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2535
    __ vdivsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2536
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2537
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2538
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2539
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2540
instruct divD_reg_mem(regD dst, regD src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2541
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2542
  match(Set dst (DivD src1 (LoadD src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2543
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2544
  format %{ "vdivsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2545
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2546
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2547
    __ vdivsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2548
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2549
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2550
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2551
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2552
instruct divD_reg_imm(regD dst, regD src, immD con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2553
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2554
  match(Set dst (DivD src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2555
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2556
  format %{ "vdivsd  $dst, $src, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2557
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2558
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2559
    __ vdivsd($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2560
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2561
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2562
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2563
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2564
instruct absF_reg(regF dst) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2565
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2566
  match(Set dst (AbsF dst));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2567
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2568
  format %{ "andps   $dst, [0x7fffffff]\t# abs float by sign masking" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2569
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2570
    __ andps($dst$$XMMRegister, ExternalAddress(float_signmask()));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2571
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2572
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2573
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2574
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2575
instruct absF_reg_reg(vlRegF dst, vlRegF src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2576
  predicate(UseAVX > 0);
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2577
  match(Set dst (AbsF src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2578
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2579
  format %{ "vandps  $dst, $src, [0x7fffffff]\t# abs float by sign masking" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2580
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2581
    int vector_len = 0;
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2582
    __ vandps($dst$$XMMRegister, $src$$XMMRegister,
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2583
              ExternalAddress(float_signmask()), vector_len);
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2584
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2585
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2586
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2587
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2588
instruct absD_reg(regD dst) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2589
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2590
  match(Set dst (AbsD dst));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2591
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2592
  format %{ "andpd   $dst, [0x7fffffffffffffff]\t"
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2593
            "# abs double by sign masking" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2594
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2595
    __ andpd($dst$$XMMRegister, ExternalAddress(double_signmask()));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2596
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2597
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2598
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2599
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2600
instruct absD_reg_reg(vlRegD dst, vlRegD src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2601
  predicate(UseAVX > 0);
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2602
  match(Set dst (AbsD src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2603
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2604
  format %{ "vandpd  $dst, $src, [0x7fffffffffffffff]\t"
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2605
            "# abs double by sign masking" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2606
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2607
    int vector_len = 0;
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2608
    __ vandpd($dst$$XMMRegister, $src$$XMMRegister,
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2609
              ExternalAddress(double_signmask()), vector_len);
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2610
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2611
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2612
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2613
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2614
instruct negF_reg(regF dst) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2615
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2616
  match(Set dst (NegF dst));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2617
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2618
  format %{ "xorps   $dst, [0x80000000]\t# neg float by sign flipping" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2619
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2620
    __ xorps($dst$$XMMRegister, ExternalAddress(float_signflip()));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2621
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2622
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2623
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2624
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2625
instruct negF_reg_reg(vlRegF dst, vlRegF src) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2626
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2627
  match(Set dst (NegF src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2628
  ins_cost(150);
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2629
  format %{ "vnegatess  $dst, $src, [0x80000000]\t# neg float by sign flipping" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2630
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2631
    __ vnegatess($dst$$XMMRegister, $src$$XMMRegister,
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2632
                 ExternalAddress(float_signflip()));
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2633
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2634
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2635
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2636
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2637
instruct negD_reg(regD dst) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2638
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2639
  match(Set dst (NegD dst));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2640
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2641
  format %{ "xorpd   $dst, [0x8000000000000000]\t"
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2642
            "# neg double by sign flipping" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2643
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2644
    __ xorpd($dst$$XMMRegister, ExternalAddress(double_signflip()));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2645
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2646
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2647
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2648
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2649
instruct negD_reg_reg(vlRegD dst, vlRegD src) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2650
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2651
  match(Set dst (NegD src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2652
  ins_cost(150);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2653
  format %{ "vnegatesd  $dst, $src, [0x8000000000000000]\t"
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2654
            "# neg double by sign flipping" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2655
  ins_encode %{
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2656
    __ vnegatesd($dst$$XMMRegister, $src$$XMMRegister,
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2657
                 ExternalAddress(double_signflip()));
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2658
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2659
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2660
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2661
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2662
instruct sqrtF_reg(regF dst, regF src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2663
  predicate(UseSSE>=1);
48089
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  2664
  match(Set dst (SqrtF src));
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2665
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2666
  format %{ "sqrtss  $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2667
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2668
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2669
    __ sqrtss($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2670
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2671
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2672
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2673
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2674
instruct sqrtF_mem(regF dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2675
  predicate(UseSSE>=1);
48089
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  2676
  match(Set dst (SqrtF (LoadF src)));
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2677
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2678
  format %{ "sqrtss  $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2679
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2680
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2681
    __ sqrtss($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2682
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2683
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2684
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2685
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2686
instruct sqrtF_imm(regF dst, immF con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2687
  predicate(UseSSE>=1);
48089
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  2688
  match(Set dst (SqrtF con));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  2689
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2690
  format %{ "sqrtss  $dst, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2691
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2692
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2693
    __ sqrtss($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2694
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2695
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2696
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2697
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2698
instruct sqrtD_reg(regD dst, regD src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2699
  predicate(UseSSE>=2);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2700
  match(Set dst (SqrtD src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2701
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2702
  format %{ "sqrtsd  $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2703
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2704
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2705
    __ sqrtsd($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2706
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2707
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2708
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2709
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2710
instruct sqrtD_mem(regD dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2711
  predicate(UseSSE>=2);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2712
  match(Set dst (SqrtD (LoadD src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2713
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2714
  format %{ "sqrtsd  $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2715
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2716
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2717
    __ sqrtsd($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2718
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2719
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2720
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2721
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2722
instruct sqrtD_imm(regD dst, immD con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2723
  predicate(UseSSE>=2);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2724
  match(Set dst (SqrtD con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2725
  format %{ "sqrtsd  $dst, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2726
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2727
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2728
    __ sqrtsd($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2729
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2730
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2731
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2732
58421
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2733
58450
67b3480882b4 8231713: x86_32 build failures after JDK-8226721 (Missing intrinsics for Math.ceil, floor, rint)
shade
parents: 58421
diff changeset
  2734
#ifdef _LP64
58421
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2735
instruct roundD_reg(legRegD dst, legRegD src, immU8 rmode) %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2736
  predicate(UseSSE>=4);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2737
  match(Set dst (RoundDoubleMode src rmode));
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2738
  format %{ "roundsd  $dst, $src" %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2739
  ins_cost(150);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2740
  ins_encode %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2741
    __ roundsd($dst$$XMMRegister, $src$$XMMRegister, $rmode$$constant);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2742
  %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2743
  ins_pipe(pipe_slow);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2744
%}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2745
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2746
instruct roundD_mem(legRegD dst, memory src, immU8 rmode) %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2747
  predicate(UseSSE>=4);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2748
  match(Set dst (RoundDoubleMode (LoadD src) rmode));
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2749
  format %{ "roundsd  $dst, $src" %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2750
  ins_cost(150);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2751
  ins_encode %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2752
    __ roundsd($dst$$XMMRegister, $src$$Address, $rmode$$constant);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2753
  %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2754
  ins_pipe(pipe_slow);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2755
%}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2756
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2757
instruct roundD_imm(legRegD dst, immD con, immU8 rmode, rRegI scratch_reg) %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2758
  predicate(UseSSE>=4);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2759
  match(Set dst (RoundDoubleMode con rmode));
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2760
  effect(TEMP scratch_reg);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2761
  format %{ "roundsd $dst, [$constantaddress]\t# load from constant table: double=$con" %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2762
  ins_cost(150);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2763
  ins_encode %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2764
    __ roundsd($dst$$XMMRegister, $constantaddress($con), $rmode$$constant, $scratch_reg$$Register);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2765
  %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2766
  ins_pipe(pipe_slow);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2767
%}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2768
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2769
instruct vround2D_reg(legVecX dst, legVecX src, immU8 rmode) %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2770
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2771
  match(Set dst (RoundDoubleModeV src rmode));
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2772
  format %{ "vroundpd  $dst, $src, $rmode\t! round packed2D" %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2773
  ins_encode %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2774
    int vector_len = 0;
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2775
    __ vroundpd($dst$$XMMRegister, $src$$XMMRegister, $rmode$$constant, vector_len);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2776
  %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2777
  ins_pipe( pipe_slow );
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2778
%}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2779
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2780
instruct vround2D_mem(legVecX dst, memory mem, immU8 rmode) %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2781
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2782
  match(Set dst (RoundDoubleModeV (LoadVector mem) rmode));
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2783
  format %{ "vroundpd $dst, $mem, $rmode\t! round packed2D" %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2784
  ins_encode %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2785
    int vector_len = 0;
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2786
    __ vroundpd($dst$$XMMRegister, $mem$$Address, $rmode$$constant, vector_len);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2787
  %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2788
  ins_pipe( pipe_slow );
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2789
%}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2790
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2791
instruct vround4D_reg(legVecY dst, legVecY src, legVecY rmode) %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2792
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2793
  match(Set dst (RoundDoubleModeV src rmode));
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2794
  format %{ "vroundpd  $dst, $src, $rmode\t! round packed4D" %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2795
  ins_encode %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2796
    int vector_len = 1;
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2797
    __ vroundpd($dst$$XMMRegister, $src$$XMMRegister, $rmode$$constant, vector_len);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2798
  %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2799
  ins_pipe( pipe_slow );
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2800
%}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2801
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2802
instruct vround4D_mem(legVecY dst, memory mem, immU8 rmode) %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2803
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2804
  match(Set dst (RoundDoubleModeV (LoadVector mem) rmode));
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2805
  format %{ "vroundpd $dst, $mem, $rmode\t! round packed4D" %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2806
  ins_encode %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2807
    int vector_len = 1;
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2808
    __ vroundpd($dst$$XMMRegister, $mem$$Address, $rmode$$constant, vector_len);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2809
  %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2810
  ins_pipe( pipe_slow );
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2811
%}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2812
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2813
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2814
instruct vround8D_reg(vecZ dst, vecZ src, immU8 rmode) %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2815
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2816
  match(Set dst (RoundDoubleModeV src rmode));
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2817
  format %{ "vrndscalepd $dst, $src, $rmode\t! round packed8D" %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2818
  ins_encode %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2819
    int vector_len = 2;
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2820
    __ vrndscalepd($dst$$XMMRegister, $src$$XMMRegister, $rmode$$constant, vector_len);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2821
  %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2822
  ins_pipe( pipe_slow );
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2823
%}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2824
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2825
instruct vround8D_mem(vecZ dst, memory mem, immU8 rmode) %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2826
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2827
  match(Set dst (RoundDoubleModeV (LoadVector mem) rmode));
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2828
  format %{ "vrndscalepd $dst, $mem, $rmode\t! round packed8D" %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2829
  ins_encode %{
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2830
    int vector_len = 2;
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2831
    __ vrndscalepd($dst$$XMMRegister, $mem$$Address, $rmode$$constant, vector_len);
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2832
  %}
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2833
  ins_pipe( pipe_slow );
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2834
%}
58450
67b3480882b4 8231713: x86_32 build failures after JDK-8226721 (Missing intrinsics for Math.ceil, floor, rint)
shade
parents: 58421
diff changeset
  2835
#endif // _LP64
58421
6fc57e391539 8226721: Missing intrinsics for Math.ceil, floor, rint
neliasso
parents: 58061
diff changeset
  2836
38017
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2837
instruct onspinwait() %{
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2838
  match(OnSpinWait);
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2839
  ins_cost(200);
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2840
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2841
  format %{
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2842
    $$template
51996
84743156e780 8188764: Obsolete AssumeMP and then remove all support for non-MP builds
dholmes
parents: 51857
diff changeset
  2843
    $$emit$$"pause\t! membar_onspinwait"
38017
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2844
  %}
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2845
  ins_encode %{
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2846
    __ pause();
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2847
  %}
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2848
  ins_pipe(pipe_slow);
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2849
%}
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2850
41323
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2851
// a * b + c
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2852
instruct fmaD_reg(regD a, regD b, regD c) %{
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2853
  predicate(UseFMA);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2854
  match(Set c (FmaD  c (Binary a b)));
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2855
  format %{ "fmasd $a,$b,$c\t# $c = $a * $b + $c" %}
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2856
  ins_cost(150);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2857
  ins_encode %{
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2858
    __ fmad($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2859
  %}
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2860
  ins_pipe( pipe_slow );
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2861
%}
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2862
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2863
// a * b + c
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2864
instruct fmaF_reg(regF a, regF b, regF c) %{
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2865
  predicate(UseFMA);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2866
  match(Set c (FmaF  c (Binary a b)));
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2867
  format %{ "fmass $a,$b,$c\t# $c = $a * $b + $c" %}
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2868
  ins_cost(150);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2869
  ins_encode %{
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2870
    __ fmaf($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2871
  %}
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2872
  ins_pipe( pipe_slow );
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2873
%}
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2874
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2875
// ====================VECTOR INSTRUCTIONS=====================================
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2876
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2877
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2878
// Load vectors (4 bytes long)
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2879
instruct loadV4(vecS dst, memory mem) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2880
  predicate(n->as_LoadVector()->memory_size() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2881
  match(Set dst (LoadVector mem));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2882
  ins_cost(125);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2883
  format %{ "movd    $dst,$mem\t! load vector (4 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2884
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2885
    __ movdl($dst$$XMMRegister, $mem$$Address);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2886
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2887
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2888
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2889
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2890
// Load vectors (4 bytes long)
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2891
instruct MoveVecS2Leg(legVecS dst, vecS src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2892
  match(Set dst src);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2893
  format %{ "movss $dst,$src\t! load vector (4 bytes)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2894
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2895
    __ movflt($dst$$XMMRegister, $src$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2896
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2897
  ins_pipe( fpu_reg_reg );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2898
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2899
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2900
// Load vectors (4 bytes long)
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2901
instruct MoveLeg2VecS(vecS dst, legVecS src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2902
  match(Set dst src);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2903
  format %{ "movss $dst,$src\t! load vector (4 bytes)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2904
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2905
    __ movflt($dst$$XMMRegister, $src$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2906
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2907
  ins_pipe( fpu_reg_reg );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2908
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2909
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2910
// Load vectors (8 bytes long)
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2911
instruct loadV8(vecD dst, memory mem) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2912
  predicate(n->as_LoadVector()->memory_size() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2913
  match(Set dst (LoadVector mem));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2914
  ins_cost(125);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2915
  format %{ "movq    $dst,$mem\t! load vector (8 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2916
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2917
    __ movq($dst$$XMMRegister, $mem$$Address);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2918
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2919
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2920
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2921
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2922
// Load vectors (8 bytes long)
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2923
instruct MoveVecD2Leg(legVecD dst, vecD src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2924
  match(Set dst src);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2925
  format %{ "movsd $dst,$src\t! load vector (8 bytes)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2926
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2927
    __ movdbl($dst$$XMMRegister, $src$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2928
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2929
  ins_pipe( fpu_reg_reg );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2930
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2931
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2932
// Load vectors (8 bytes long)
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2933
instruct MoveLeg2VecD(vecD dst, legVecD src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2934
  match(Set dst src);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2935
  format %{ "movsd $dst,$src\t! load vector (8 bytes)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2936
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2937
    __ movdbl($dst$$XMMRegister, $src$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2938
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2939
  ins_pipe( fpu_reg_reg );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2940
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2941
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2942
// Load vectors (16 bytes long)
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2943
instruct loadV16(vecX dst, memory mem) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2944
  predicate(n->as_LoadVector()->memory_size() == 16);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2945
  match(Set dst (LoadVector mem));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2946
  ins_cost(125);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2947
  format %{ "movdqu  $dst,$mem\t! load vector (16 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2948
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2949
    __ movdqu($dst$$XMMRegister, $mem$$Address);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2950
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2951
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2952
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2953
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2954
// Load vectors (16 bytes long)
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2955
instruct MoveVecX2Leg(legVecX dst, vecX src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2956
  match(Set dst src);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2957
  format %{ "movdqu $dst,$src\t! load vector (16 bytes)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2958
  ins_encode %{
53171
3ab3cb8a8d41 8215888: Register to register spill may use AVX 512 move instruction on unsupported platform.
sviswanathan
parents: 52992
diff changeset
  2959
    if (UseAVX > 2 && !VM_Version::supports_avx512vl()) {
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2960
      int vector_len = 2;
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2961
      __ evmovdquq($dst$$XMMRegister, $src$$XMMRegister, vector_len);
53171
3ab3cb8a8d41 8215888: Register to register spill may use AVX 512 move instruction on unsupported platform.
sviswanathan
parents: 52992
diff changeset
  2962
    } else {
3ab3cb8a8d41 8215888: Register to register spill may use AVX 512 move instruction on unsupported platform.
sviswanathan
parents: 52992
diff changeset
  2963
      __ movdqu($dst$$XMMRegister, $src$$XMMRegister);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2964
    }
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2965
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2966
  ins_pipe( fpu_reg_reg );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2967
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2968
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2969
// Load vectors (16 bytes long)
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2970
instruct MoveLeg2VecX(vecX dst, legVecX src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2971
  match(Set dst src);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2972
  format %{ "movdqu $dst,$src\t! load vector (16 bytes)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2973
  ins_encode %{
53171
3ab3cb8a8d41 8215888: Register to register spill may use AVX 512 move instruction on unsupported platform.
sviswanathan
parents: 52992
diff changeset
  2974
    if (UseAVX > 2 && !VM_Version::supports_avx512vl()) {
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2975
      int vector_len = 2;
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2976
      __ evmovdquq($dst$$XMMRegister, $src$$XMMRegister, vector_len);
53171
3ab3cb8a8d41 8215888: Register to register spill may use AVX 512 move instruction on unsupported platform.
sviswanathan
parents: 52992
diff changeset
  2977
    } else {
3ab3cb8a8d41 8215888: Register to register spill may use AVX 512 move instruction on unsupported platform.
sviswanathan
parents: 52992
diff changeset
  2978
      __ movdqu($dst$$XMMRegister, $src$$XMMRegister);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2979
    }
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2980
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2981
  ins_pipe( fpu_reg_reg );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2982
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2983
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2984
// Load vectors (32 bytes long)
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2985
instruct loadV32(vecY dst, memory mem) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2986
  predicate(n->as_LoadVector()->memory_size() == 32);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2987
  match(Set dst (LoadVector mem));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2988
  ins_cost(125);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2989
  format %{ "vmovdqu $dst,$mem\t! load vector (32 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2990
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2991
    __ vmovdqu($dst$$XMMRegister, $mem$$Address);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2992
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2993
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2994
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2995
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2996
// Load vectors (32 bytes long)
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2997
instruct MoveVecY2Leg(legVecY dst, vecY src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2998
  match(Set dst src);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  2999
  format %{ "vmovdqu $dst,$src\t! load vector (32 bytes)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3000
  ins_encode %{
53171
3ab3cb8a8d41 8215888: Register to register spill may use AVX 512 move instruction on unsupported platform.
sviswanathan
parents: 52992
diff changeset
  3001
    if (UseAVX > 2 && !VM_Version::supports_avx512vl()) {
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3002
      int vector_len = 2;
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3003
      __ evmovdquq($dst$$XMMRegister, $src$$XMMRegister, vector_len);
53171
3ab3cb8a8d41 8215888: Register to register spill may use AVX 512 move instruction on unsupported platform.
sviswanathan
parents: 52992
diff changeset
  3004
    } else {
3ab3cb8a8d41 8215888: Register to register spill may use AVX 512 move instruction on unsupported platform.
sviswanathan
parents: 52992
diff changeset
  3005
      __ vmovdqu($dst$$XMMRegister, $src$$XMMRegister);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3006
    }
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3007
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3008
  ins_pipe( fpu_reg_reg );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3009
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3010
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3011
// Load vectors (32 bytes long)
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3012
instruct MoveLeg2VecY(vecY dst, legVecY src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3013
  match(Set dst src);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3014
  format %{ "vmovdqu $dst,$src\t! load vector (32 bytes)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3015
  ins_encode %{
53171
3ab3cb8a8d41 8215888: Register to register spill may use AVX 512 move instruction on unsupported platform.
sviswanathan
parents: 52992
diff changeset
  3016
    if (UseAVX > 2 && !VM_Version::supports_avx512vl()) {
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3017
      int vector_len = 2;
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3018
      __ evmovdquq($dst$$XMMRegister, $src$$XMMRegister, vector_len);
53171
3ab3cb8a8d41 8215888: Register to register spill may use AVX 512 move instruction on unsupported platform.
sviswanathan
parents: 52992
diff changeset
  3019
    } else {
3ab3cb8a8d41 8215888: Register to register spill may use AVX 512 move instruction on unsupported platform.
sviswanathan
parents: 52992
diff changeset
  3020
      __ vmovdqu($dst$$XMMRegister, $src$$XMMRegister);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3021
    }
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3022
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3023
  ins_pipe( fpu_reg_reg );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3024
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3025
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3026
// Load vectors (64 bytes long)
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3027
instruct loadV64_dword(vecZ dst, memory mem) %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3028
  predicate(n->as_LoadVector()->memory_size() == 64 && n->as_LoadVector()->element_size() <= 4);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3029
  match(Set dst (LoadVector mem));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3030
  ins_cost(125);
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3031
  format %{ "vmovdqul $dst k0,$mem\t! load vector (64 bytes)" %}
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3032
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3033
    int vector_len = 2;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3034
    __ evmovdqul($dst$$XMMRegister, $mem$$Address, vector_len);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3035
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3036
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3037
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3038
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3039
// Load vectors (64 bytes long)
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3040
instruct loadV64_qword(vecZ dst, memory mem) %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3041
  predicate(n->as_LoadVector()->memory_size() == 64 && n->as_LoadVector()->element_size() > 4);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3042
  match(Set dst (LoadVector mem));
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3043
  ins_cost(125);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3044
  format %{ "vmovdquq $dst k0,$mem\t! load vector (64 bytes)" %}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3045
  ins_encode %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3046
    int vector_len = 2;
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3047
    __ evmovdquq($dst$$XMMRegister, $mem$$Address, vector_len);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3048
  %}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3049
  ins_pipe( pipe_slow );
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3050
%}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3051
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3052
instruct MoveVecZ2Leg(legVecZ dst, vecZ  src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3053
  match(Set dst src);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3054
  format %{ "vmovdquq $dst k0,$src\t! Move vector (64 bytes)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3055
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3056
    int vector_len = 2;
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3057
    __ evmovdquq($dst$$XMMRegister, $src$$XMMRegister, vector_len);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3058
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3059
  ins_pipe( fpu_reg_reg );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3060
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3061
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3062
instruct MoveLeg2VecZ(vecZ dst, legVecZ  src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3063
  match(Set dst src);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3064
  format %{ "vmovdquq $dst k0,$src\t! Move vector (64 bytes)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3065
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3066
    int vector_len = 2;
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3067
    __ evmovdquq($dst$$XMMRegister, $src$$XMMRegister, vector_len);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3068
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3069
  ins_pipe( fpu_reg_reg );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3070
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3071
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3072
// Store vectors
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3073
instruct storeV4(memory mem, vecS src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3074
  predicate(n->as_StoreVector()->memory_size() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3075
  match(Set mem (StoreVector mem src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3076
  ins_cost(145);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3077
  format %{ "movd    $mem,$src\t! store vector (4 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3078
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3079
    __ movdl($mem$$Address, $src$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3080
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3081
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3082
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3083
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3084
instruct storeV8(memory mem, vecD src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3085
  predicate(n->as_StoreVector()->memory_size() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3086
  match(Set mem (StoreVector mem src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3087
  ins_cost(145);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3088
  format %{ "movq    $mem,$src\t! store vector (8 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3089
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3090
    __ movq($mem$$Address, $src$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3091
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3092
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3093
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3094
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3095
instruct storeV16(memory mem, vecX src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3096
  predicate(n->as_StoreVector()->memory_size() == 16);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3097
  match(Set mem (StoreVector mem src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3098
  ins_cost(145);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3099
  format %{ "movdqu  $mem,$src\t! store vector (16 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3100
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3101
    __ movdqu($mem$$Address, $src$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3102
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3103
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3104
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3105
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3106
instruct storeV32(memory mem, vecY src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3107
  predicate(n->as_StoreVector()->memory_size() == 32);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3108
  match(Set mem (StoreVector mem src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3109
  ins_cost(145);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3110
  format %{ "vmovdqu $mem,$src\t! store vector (32 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3111
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3112
    __ vmovdqu($mem$$Address, $src$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3113
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3114
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3115
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3116
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3117
instruct storeV64_dword(memory mem, vecZ src) %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3118
  predicate(n->as_StoreVector()->memory_size() == 64 && n->as_StoreVector()->element_size() <= 4);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3119
  match(Set mem (StoreVector mem src));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3120
  ins_cost(145);
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3121
  format %{ "vmovdqul $mem k0,$src\t! store vector (64 bytes)" %}
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3122
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3123
    int vector_len = 2;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3124
    __ evmovdqul($mem$$Address, $src$$XMMRegister, vector_len);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3125
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3126
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3127
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3128
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3129
instruct storeV64_qword(memory mem, vecZ src) %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3130
  predicate(n->as_StoreVector()->memory_size() == 64 && n->as_StoreVector()->element_size() > 4);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3131
  match(Set mem (StoreVector mem src));
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3132
  ins_cost(145);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3133
  format %{ "vmovdquq $mem k0,$src\t! store vector (64 bytes)" %}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3134
  ins_encode %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3135
    int vector_len = 2;
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3136
    __ evmovdquq($mem$$Address, $src$$XMMRegister, vector_len);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3137
  %}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3138
  ins_pipe( pipe_slow );
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3139
%}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  3140
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3141
// ====================LEGACY REPLICATE=======================================
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3142
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3143
instruct Repl16B(vecX dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3144
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3145
  match(Set dst (ReplicateB src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3146
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3147
            "punpcklbw $dst,$dst\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3148
            "pshuflw $dst,$dst,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3149
            "punpcklqdq $dst,$dst\t! replicate16B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3150
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3151
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3152
    __ punpcklbw($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3153
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3154
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3155
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3156
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3157
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3158
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3159
instruct Repl32B(vecY dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3160
  predicate(n->as_Vector()->length() == 32 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3161
  match(Set dst (ReplicateB src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3162
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3163
            "punpcklbw $dst,$dst\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3164
            "pshuflw $dst,$dst,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3165
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3166
            "vinserti128_high $dst,$dst\t! replicate32B" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3167
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3168
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3169
    __ punpcklbw($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3170
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3171
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3172
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3173
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3174
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3175
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3176
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3177
instruct Repl64B(legVecZ dst, rRegI src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3178
  predicate(n->as_Vector()->length() == 64 && !VM_Version::supports_avx512vlbw());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3179
  match(Set dst (ReplicateB src));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3180
  format %{ "movd    $dst,$src\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3181
            "punpcklbw $dst,$dst\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3182
            "pshuflw $dst,$dst,0x00\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3183
            "punpcklqdq $dst,$dst\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3184
            "vinserti128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3185
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate64B" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3186
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3187
    __ movdl($dst$$XMMRegister, $src$$Register);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3188
    __ punpcklbw($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3189
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3190
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3191
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3192
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3193
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3194
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3195
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3196
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3197
instruct Repl16B_imm(vecX dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3198
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3199
  match(Set dst (ReplicateB con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3200
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3201
            "punpcklqdq $dst,$dst\t! replicate16B($con)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3202
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3203
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3204
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3205
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3206
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3207
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3208
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3209
instruct Repl32B_imm(vecY dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3210
  predicate(n->as_Vector()->length() == 32 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3211
  match(Set dst (ReplicateB con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3212
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3213
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3214
            "vinserti128_high $dst,$dst\t! lreplicate32B($con)" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3215
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3216
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3217
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3218
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3219
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3220
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3221
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3222
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3223
instruct Repl64B_imm(legVecZ dst, immI con) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3224
  predicate(n->as_Vector()->length() == 64 && !VM_Version::supports_avx512vlbw());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3225
  match(Set dst (ReplicateB con));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3226
  format %{ "movq    $dst,[$constantaddress]\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3227
            "punpcklqdq $dst,$dst\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3228
            "vinserti128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3229
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate64B($con)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3230
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3231
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3232
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3233
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3234
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3235
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3236
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3237
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3238
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3239
instruct Repl4S(vecD dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3240
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3241
  match(Set dst (ReplicateS src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3242
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3243
            "pshuflw $dst,$dst,0x00\t! replicate4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3244
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3245
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3246
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3247
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3248
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3249
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3250
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3251
instruct Repl4S_mem(vecD dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3252
  predicate(n->as_Vector()->length() == 4 && UseAVX > 0 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3253
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3254
  format %{ "pshuflw $dst,$mem,0x00\t! replicate4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3255
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3256
    __ pshuflw($dst$$XMMRegister, $mem$$Address, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3257
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3258
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3259
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3260
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3261
instruct Repl8S(vecX dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3262
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3263
  match(Set dst (ReplicateS src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3264
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3265
            "pshuflw $dst,$dst,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3266
            "punpcklqdq $dst,$dst\t! replicate8S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3267
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3268
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3269
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3270
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3271
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3272
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3273
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3274
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3275
instruct Repl8S_mem(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3276
  predicate(n->as_Vector()->length() == 8 && UseAVX > 0 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3277
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3278
  format %{ "pshuflw $dst,$mem,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3279
            "punpcklqdq $dst,$dst\t! replicate8S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3280
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3281
    __ pshuflw($dst$$XMMRegister, $mem$$Address, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3282
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3283
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3284
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3285
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3286
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3287
instruct Repl8S_imm(vecX dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3288
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3289
  match(Set dst (ReplicateS con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3290
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3291
            "punpcklqdq $dst,$dst\t! replicate8S($con)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3292
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3293
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3294
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3295
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3296
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3297
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3298
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3299
instruct Repl16S(vecY dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3300
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3301
  match(Set dst (ReplicateS src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3302
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3303
            "pshuflw $dst,$dst,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3304
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3305
            "vinserti128_high $dst,$dst\t! replicate16S" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3306
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3307
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3308
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3309
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3310
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3311
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3312
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3313
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3314
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3315
instruct Repl16S_mem(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3316
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3317
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3318
  format %{ "pshuflw $dst,$mem,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3319
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3320
            "vinserti128_high $dst,$dst\t! replicate16S" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3321
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3322
    __ pshuflw($dst$$XMMRegister, $mem$$Address, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3323
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3324
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3325
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3326
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3327
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3328
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3329
instruct Repl16S_imm(vecY dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3330
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3331
  match(Set dst (ReplicateS con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3332
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3333
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3334
            "vinserti128_high $dst,$dst\t! replicate16S($con)" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3335
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3336
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3337
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3338
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3339
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3340
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3341
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3342
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3343
instruct Repl32S(legVecZ dst, rRegI src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3344
  predicate(n->as_Vector()->length() == 32 && !VM_Version::supports_avx512vlbw());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3345
  match(Set dst (ReplicateS src));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3346
  format %{ "movd    $dst,$src\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3347
            "pshuflw $dst,$dst,0x00\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3348
            "punpcklqdq $dst,$dst\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3349
            "vinserti128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3350
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate32S" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3351
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3352
    __ movdl($dst$$XMMRegister, $src$$Register);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3353
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3354
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3355
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3356
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3357
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3358
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3359
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3360
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3361
instruct Repl32S_mem(legVecZ dst, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3362
  predicate(n->as_Vector()->length() == 32 && !VM_Version::supports_avx512vlbw());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3363
  match(Set dst (ReplicateS (LoadS mem)));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3364
  format %{ "pshuflw $dst,$mem,0x00\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3365
            "punpcklqdq $dst,$dst\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3366
            "vinserti128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3367
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate32S" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3368
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3369
    __ pshuflw($dst$$XMMRegister, $mem$$Address, 0x00);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3370
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3371
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3372
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3373
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3374
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3375
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3376
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3377
instruct Repl32S_imm(legVecZ dst, immI con) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3378
  predicate(n->as_Vector()->length() == 32 && !VM_Version::supports_avx512vlbw());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3379
  match(Set dst (ReplicateS con));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3380
  format %{ "movq    $dst,[$constantaddress]\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3381
            "punpcklqdq $dst,$dst\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3382
            "vinserti128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3383
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate32S($con)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3384
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3385
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3386
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3387
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3388
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3389
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3390
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3391
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3392
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3393
instruct Repl4I(vecX dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3394
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3395
  match(Set dst (ReplicateI src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3396
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3397
            "pshufd  $dst,$dst,0x00\t! replicate4I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3398
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3399
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3400
    __ pshufd($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3401
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3402
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3403
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3404
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3405
instruct Repl4I_mem(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3406
  predicate(n->as_Vector()->length() == 4 && UseAVX > 0 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3407
  match(Set dst (ReplicateI (LoadI mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3408
  format %{ "pshufd  $dst,$mem,0x00\t! replicate4I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3409
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3410
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3411
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3412
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3413
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3414
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3415
instruct Repl8I(vecY dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3416
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3417
  match(Set dst (ReplicateI src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3418
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3419
            "pshufd  $dst,$dst,0x00\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3420
            "vinserti128_high $dst,$dst\t! replicate8I" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3421
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3422
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3423
    __ pshufd($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3424
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3425
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3426
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3427
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3428
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3429
instruct Repl8I_mem(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3430
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3431
  match(Set dst (ReplicateI (LoadI mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3432
  format %{ "pshufd  $dst,$mem,0x00\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3433
            "vinserti128_high $dst,$dst\t! replicate8I" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3434
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3435
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x00);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3436
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3437
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3438
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3439
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3440
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3441
instruct Repl16I(legVecZ dst, rRegI src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3442
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vl());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3443
  match(Set dst (ReplicateI src));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3444
  format %{ "movd    $dst,$src\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3445
            "pshufd  $dst,$dst,0x00\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3446
            "vinserti128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3447
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate16I" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3448
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3449
    __ movdl($dst$$XMMRegister, $src$$Register);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3450
    __ pshufd($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3451
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3452
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3453
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3454
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3455
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3456
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3457
instruct Repl16I_mem(legVecZ dst, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3458
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vl());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3459
  match(Set dst (ReplicateI (LoadI mem)));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3460
  format %{ "pshufd  $dst,$mem,0x00\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3461
            "vinserti128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3462
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate16I" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3463
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3464
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x00);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3465
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3466
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3467
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3468
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3469
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3470
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3471
instruct Repl4I_imm(vecX dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3472
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3473
  match(Set dst (ReplicateI con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3474
  format %{ "movq    $dst,[$constantaddress]\t! replicate4I($con)\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3475
            "punpcklqdq $dst,$dst" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3476
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3477
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3478
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3479
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3480
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3481
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3482
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3483
instruct Repl8I_imm(vecY dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3484
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3485
  match(Set dst (ReplicateI con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3486
  format %{ "movq    $dst,[$constantaddress]\t! replicate8I($con)\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3487
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3488
            "vinserti128_high $dst,$dst" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3489
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3490
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3491
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3492
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3493
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3494
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3495
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3496
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3497
instruct Repl16I_imm(legVecZ dst, immI con) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3498
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vl());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3499
  match(Set dst (ReplicateI con));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3500
  format %{ "movq    $dst,[$constantaddress]\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3501
            "punpcklqdq $dst,$dst\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3502
            "vinserti128_high $dst,$dst"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3503
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate16I($con)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3504
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3505
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3506
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3507
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3508
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3509
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3510
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3511
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3512
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3513
// Long could be loaded into xmm register directly from memory.
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3514
instruct Repl2L_mem(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3515
  predicate(n->as_Vector()->length() == 2 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3516
  match(Set dst (ReplicateL (LoadL mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3517
  format %{ "movq    $dst,$mem\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3518
            "punpcklqdq $dst,$dst\t! replicate2L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3519
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3520
    __ movq($dst$$XMMRegister, $mem$$Address);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3521
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3522
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3523
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3524
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3525
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3526
// Replicate long (8 byte) scalar to be vector
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3527
#ifdef _LP64
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3528
instruct Repl4L(vecY dst, rRegL src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3529
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3530
  match(Set dst (ReplicateL src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3531
  format %{ "movdq   $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3532
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3533
            "vinserti128_high $dst,$dst\t! replicate4L" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3534
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3535
    __ movdq($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3536
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3537
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3538
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3539
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3540
%}
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3541
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3542
instruct Repl8L(legVecZ dst, rRegL src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3543
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3544
  match(Set dst (ReplicateL src));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3545
  format %{ "movdq   $dst,$src\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3546
            "punpcklqdq $dst,$dst\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3547
            "vinserti128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3548
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate8L" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3549
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3550
    __ movdq($dst$$XMMRegister, $src$$Register);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3551
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3552
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3553
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3554
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3555
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3556
%}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3557
#else // _LP64
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3558
instruct Repl4L(vecY dst, eRegL src, vecY tmp) %{
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3559
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3560
  match(Set dst (ReplicateL src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3561
  effect(TEMP dst, USE src, TEMP tmp);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3562
  format %{ "movdl   $dst,$src.lo\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3563
            "movdl   $tmp,$src.hi\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3564
            "punpckldq $dst,$tmp\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3565
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3566
            "vinserti128_high $dst,$dst\t! replicate4L" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3567
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3568
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3569
    __ movdl($tmp$$XMMRegister, HIGH_FROM_LOW($src$$Register));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3570
    __ punpckldq($dst$$XMMRegister, $tmp$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3571
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3572
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3573
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3574
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3575
%}
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3576
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3577
instruct Repl8L(legVecZ dst, eRegL src, legVecZ tmp) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3578
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3579
  match(Set dst (ReplicateL src));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3580
  effect(TEMP dst, USE src, TEMP tmp);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3581
  format %{ "movdl   $dst,$src.lo\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3582
            "movdl   $tmp,$src.hi\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3583
            "punpckldq $dst,$tmp\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3584
            "punpcklqdq $dst,$dst\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3585
            "vinserti128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3586
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate8L" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3587
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3588
    __ movdl($dst$$XMMRegister, $src$$Register);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3589
    __ movdl($tmp$$XMMRegister, HIGH_FROM_LOW($src$$Register));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3590
    __ punpckldq($dst$$XMMRegister, $tmp$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3591
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3592
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3593
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3594
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3595
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3596
%}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3597
#endif // _LP64
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3598
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3599
instruct Repl4L_imm(vecY dst, immL con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3600
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3601
  match(Set dst (ReplicateL con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3602
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3603
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3604
            "vinserti128_high $dst,$dst\t! replicate4L($con)" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3605
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3606
    __ movq($dst$$XMMRegister, $constantaddress($con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3607
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3608
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3609
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3610
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3611
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3612
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3613
instruct Repl8L_imm(legVecZ dst, immL con) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3614
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3615
  match(Set dst (ReplicateL con));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3616
  format %{ "movq    $dst,[$constantaddress]\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3617
            "punpcklqdq $dst,$dst\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3618
            "vinserti128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3619
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate8L($con)" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3620
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3621
    __ movq($dst$$XMMRegister, $constantaddress($con));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3622
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3623
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3624
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3625
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3626
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3627
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3628
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3629
instruct Repl4L_mem(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3630
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3631
  match(Set dst (ReplicateL (LoadL mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3632
  format %{ "movq    $dst,$mem\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3633
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3634
            "vinserti128_high $dst,$dst\t! replicate4L" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3635
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3636
    __ movq($dst$$XMMRegister, $mem$$Address);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3637
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3638
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3639
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3640
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3641
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3642
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3643
instruct Repl8L_mem(legVecZ dst, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3644
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3645
  match(Set dst (ReplicateL (LoadL mem)));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3646
  format %{ "movq    $dst,$mem\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3647
            "punpcklqdq $dst,$dst\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3648
            "vinserti128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3649
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate8L" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3650
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3651
    __ movq($dst$$XMMRegister, $mem$$Address);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3652
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3653
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3654
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3655
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3656
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3657
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3658
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3659
instruct Repl2F_mem(vecD dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3660
  predicate(n->as_Vector()->length() == 2 && UseAVX > 0 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3661
  match(Set dst (ReplicateF (LoadF mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3662
  format %{ "pshufd  $dst,$mem,0x00\t! replicate2F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3663
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3664
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3665
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3666
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3667
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3668
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3669
instruct Repl4F_mem(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3670
  predicate(n->as_Vector()->length() == 4 && UseAVX > 0 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3671
  match(Set dst (ReplicateF (LoadF mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3672
  format %{ "pshufd  $dst,$mem,0x00\t! replicate4F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3673
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3674
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3675
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3676
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3677
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3678
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3679
instruct Repl8F(vecY dst, vlRegF src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3680
  predicate(n->as_Vector()->length() == 8 && UseAVX > 0 && !VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3681
  match(Set dst (ReplicateF src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3682
  format %{ "pshufd  $dst,$src,0x00\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3683
            "vinsertf128_high $dst,$dst\t! replicate8F" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3684
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3685
    __ pshufd($dst$$XMMRegister, $src$$XMMRegister, 0x00);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3686
    __ vinsertf128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3687
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3688
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3689
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3690
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3691
instruct Repl8F_mem(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3692
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3693
  match(Set dst (ReplicateF (LoadF mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3694
  format %{ "pshufd  $dst,$mem,0x00\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3695
            "vinsertf128_high $dst,$dst\t! replicate8F" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3696
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3697
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x00);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3698
    __ vinsertf128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3699
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3700
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3701
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3702
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3703
instruct Repl16F(legVecZ dst, vlRegF src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3704
  predicate(n->as_Vector()->length() == 16 && UseAVX > 0 && !VM_Version::supports_avx512vl());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3705
  match(Set dst (ReplicateF src));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3706
  format %{ "pshufd  $dst,$src,0x00\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3707
            "vinsertf128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3708
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate16F" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3709
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3710
    __ pshufd($dst$$XMMRegister, $src$$XMMRegister, 0x00);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3711
    __ vinsertf128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3712
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3713
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3714
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3715
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3716
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3717
instruct Repl16F_mem(legVecZ dst, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3718
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vl());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3719
  match(Set dst (ReplicateF (LoadF mem)));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3720
  format %{ "pshufd  $dst,$mem,0x00\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3721
            "vinsertf128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3722
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate16F" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3723
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3724
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x00);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3725
    __ vinsertf128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3726
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3727
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3728
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3729
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3730
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3731
instruct Repl2F_zero(vecD dst, immF0 zero) %{
58462
c6f1226cfb72 8221092: UseAVX=3 has performance degredation on Skylake (X7) processors
vdeshpande
parents: 58450
diff changeset
  3732
  predicate(n->as_Vector()->length() == 2);
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3733
  match(Set dst (ReplicateF zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3734
  format %{ "xorps   $dst,$dst\t! replicate2F zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3735
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3736
    __ xorps($dst$$XMMRegister, $dst$$XMMRegister);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3737
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3738
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3739
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3740
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3741
instruct Repl4F_zero(vecX dst, immF0 zero) %{
58462
c6f1226cfb72 8221092: UseAVX=3 has performance degredation on Skylake (X7) processors
vdeshpande
parents: 58450
diff changeset
  3742
  predicate(n->as_Vector()->length() == 4);
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3743
  match(Set dst (ReplicateF zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3744
  format %{ "xorps   $dst,$dst\t! replicate4F zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3745
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3746
    __ xorps($dst$$XMMRegister, $dst$$XMMRegister);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3747
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3748
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3749
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3750
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3751
instruct Repl8F_zero(vecY dst, immF0 zero) %{
58462
c6f1226cfb72 8221092: UseAVX=3 has performance degredation on Skylake (X7) processors
vdeshpande
parents: 58450
diff changeset
  3752
  predicate(n->as_Vector()->length() == 8 && UseAVX > 0);
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3753
  match(Set dst (ReplicateF zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3754
  format %{ "vxorps  $dst,$dst,$dst\t! replicate8F zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3755
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3756
    int vector_len = 1;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3757
    __ vxorps($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3758
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3759
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3760
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3761
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3762
instruct Repl2D_mem(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3763
  predicate(n->as_Vector()->length() == 2 && UseAVX > 0 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3764
  match(Set dst (ReplicateD (LoadD mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3765
  format %{ "pshufd  $dst,$mem,0x44\t! replicate2D" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3766
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3767
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x44);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3768
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3769
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3770
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3771
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3772
instruct Repl4D(vecY dst, vlRegD src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3773
  predicate(n->as_Vector()->length() == 4 && UseAVX > 0 && !VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3774
  match(Set dst (ReplicateD src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3775
  format %{ "pshufd  $dst,$src,0x44\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3776
            "vinsertf128_high $dst,$dst\t! replicate4D" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3777
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3778
    __ pshufd($dst$$XMMRegister, $src$$XMMRegister, 0x44);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3779
    __ vinsertf128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3780
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3781
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3782
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3783
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3784
instruct Repl4D_mem(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3785
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3786
  match(Set dst (ReplicateD (LoadD mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3787
  format %{ "pshufd  $dst,$mem,0x44\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3788
            "vinsertf128_high $dst,$dst\t! replicate4D" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3789
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3790
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x44);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3791
    __ vinsertf128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3792
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3793
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3794
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3795
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3796
instruct Repl8D(legVecZ dst, vlRegD src) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3797
  predicate(n->as_Vector()->length() == 8 && UseAVX > 0 && !VM_Version::supports_avx512vl());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3798
  match(Set dst (ReplicateD src));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3799
  format %{ "pshufd  $dst,$src,0x44\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3800
            "vinsertf128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3801
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate8D" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3802
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3803
    __ pshufd($dst$$XMMRegister, $src$$XMMRegister, 0x44);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3804
    __ vinsertf128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3805
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3806
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3807
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3808
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3809
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3810
instruct Repl8D_mem(legVecZ dst, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3811
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3812
  match(Set dst (ReplicateD (LoadD mem)));
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3813
  format %{ "pshufd  $dst,$mem,0x44\n\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3814
            "vinsertf128_high $dst,$dst\t"
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3815
            "vinserti64x4 $dst,$dst,$dst,0x1\t! replicate8D" %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3816
  ins_encode %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3817
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x44);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3818
    __ vinsertf128_high($dst$$XMMRegister, $dst$$XMMRegister);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3819
    __ vinserti64x4($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, 0x1);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3820
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3821
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3822
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  3823
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3824
// Replicate double (8 byte) scalar zero to be vector
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3825
instruct Repl2D_zero(vecX dst, immD0 zero) %{
58462
c6f1226cfb72 8221092: UseAVX=3 has performance degredation on Skylake (X7) processors
vdeshpande
parents: 58450
diff changeset
  3826
  predicate(n->as_Vector()->length() == 2);
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3827
  match(Set dst (ReplicateD zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3828
  format %{ "xorpd   $dst,$dst\t! replicate2D zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3829
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3830
    __ xorpd($dst$$XMMRegister, $dst$$XMMRegister);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3831
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3832
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3833
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3834
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3835
instruct Repl4D_zero(vecY dst, immD0 zero) %{
58462
c6f1226cfb72 8221092: UseAVX=3 has performance degredation on Skylake (X7) processors
vdeshpande
parents: 58450
diff changeset
  3836
  predicate(n->as_Vector()->length() == 4 && UseAVX > 0);
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3837
  match(Set dst (ReplicateD zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3838
  format %{ "vxorpd  $dst,$dst,$dst,vect256\t! replicate4D zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3839
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3840
    int vector_len = 1;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3841
    __ vxorpd($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3842
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3843
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3844
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3845
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3846
// ====================GENERIC REPLICATE==========================================
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3847
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3848
// Replicate byte scalar to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3849
instruct Repl4B(vecS dst, rRegI src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3850
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3851
  match(Set dst (ReplicateB src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3852
  format %{ "movd    $dst,$src\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3853
            "punpcklbw $dst,$dst\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3854
            "pshuflw $dst,$dst,0x00\t! replicate4B" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3855
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3856
    __ movdl($dst$$XMMRegister, $src$$Register);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3857
    __ punpcklbw($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3858
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3859
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3860
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3861
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3862
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3863
instruct Repl8B(vecD dst, rRegI src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3864
  predicate(n->as_Vector()->length() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3865
  match(Set dst (ReplicateB src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3866
  format %{ "movd    $dst,$src\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3867
            "punpcklbw $dst,$dst\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3868
            "pshuflw $dst,$dst,0x00\t! replicate8B" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3869
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3870
    __ movdl($dst$$XMMRegister, $src$$Register);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3871
    __ punpcklbw($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3872
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3873
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3874
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3875
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3876
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3877
// Replicate byte scalar immediate to be vector by loading from const table.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3878
instruct Repl4B_imm(vecS dst, immI con) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3879
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3880
  match(Set dst (ReplicateB con));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3881
  format %{ "movdl   $dst,[$constantaddress]\t! replicate4B($con)" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3882
  ins_encode %{
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3883
    __ movdl($dst$$XMMRegister, $constantaddress(replicate4_imm($con$$constant, 1)));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3884
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3885
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3886
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3887
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3888
instruct Repl8B_imm(vecD dst, immI con) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3889
  predicate(n->as_Vector()->length() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3890
  match(Set dst (ReplicateB con));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3891
  format %{ "movq    $dst,[$constantaddress]\t! replicate8B($con)" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3892
  ins_encode %{
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3893
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3894
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3895
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3896
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3897
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3898
// Replicate byte scalar zero to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3899
instruct Repl4B_zero(vecS dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3900
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3901
  match(Set dst (ReplicateB zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3902
  format %{ "pxor    $dst,$dst\t! replicate4B zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3903
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3904
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3905
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3906
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3907
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3908
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3909
instruct Repl8B_zero(vecD dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3910
  predicate(n->as_Vector()->length() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3911
  match(Set dst (ReplicateB zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3912
  format %{ "pxor    $dst,$dst\t! replicate8B zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3913
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3914
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3915
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3916
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3917
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3918
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3919
instruct Repl16B_zero(vecX dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3920
  predicate(n->as_Vector()->length() == 16);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3921
  match(Set dst (ReplicateB zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3922
  format %{ "pxor    $dst,$dst\t! replicate16B zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3923
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3924
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3925
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3926
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3927
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3928
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3929
instruct Repl32B_zero(vecY dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3930
  predicate(n->as_Vector()->length() == 32);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3931
  match(Set dst (ReplicateB zero));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3932
  format %{ "vpxor   $dst,$dst,$dst\t! replicate32B zero" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3933
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3934
    // Use vxorpd since AVX does not have vpxor for 256-bit (AVX2 will have it).
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3935
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3936
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3937
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3938
  ins_pipe( fpu_reg_reg );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3939
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3940
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3941
// Replicate char/short (2 byte) scalar to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3942
instruct Repl2S(vecS dst, rRegI src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3943
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3944
  match(Set dst (ReplicateS src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3945
  format %{ "movd    $dst,$src\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3946
            "pshuflw $dst,$dst,0x00\t! replicate2S" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3947
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3948
    __ movdl($dst$$XMMRegister, $src$$Register);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3949
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3950
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3951
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3952
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3953
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3954
// Replicate char/short (2 byte) scalar immediate to be vector by loading from const table.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3955
instruct Repl2S_imm(vecS dst, immI con) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3956
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3957
  match(Set dst (ReplicateS con));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3958
  format %{ "movdl   $dst,[$constantaddress]\t! replicate2S($con)" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3959
  ins_encode %{
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3960
    __ movdl($dst$$XMMRegister, $constantaddress(replicate4_imm($con$$constant, 2)));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3961
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3962
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3963
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3964
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3965
instruct Repl4S_imm(vecD dst, immI con) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3966
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3967
  match(Set dst (ReplicateS con));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3968
  format %{ "movq    $dst,[$constantaddress]\t! replicate4S($con)" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3969
  ins_encode %{
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3970
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3971
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3972
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3973
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3974
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3975
// Replicate char/short (2 byte) scalar zero to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3976
instruct Repl2S_zero(vecS dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3977
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3978
  match(Set dst (ReplicateS zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3979
  format %{ "pxor    $dst,$dst\t! replicate2S zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3980
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3981
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3982
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3983
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3984
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3985
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3986
instruct Repl4S_zero(vecD dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3987
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3988
  match(Set dst (ReplicateS zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3989
  format %{ "pxor    $dst,$dst\t! replicate4S zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3990
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3991
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3992
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3993
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3994
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3995
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3996
instruct Repl8S_zero(vecX dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3997
  predicate(n->as_Vector()->length() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3998
  match(Set dst (ReplicateS zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3999
  format %{ "pxor    $dst,$dst\t! replicate8S zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4000
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4001
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4002
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4003
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4004
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4005
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4006
instruct Repl16S_zero(vecY dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4007
  predicate(n->as_Vector()->length() == 16);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4008
  match(Set dst (ReplicateS zero));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  4009
  format %{ "vpxor   $dst,$dst,$dst\t! replicate16S zero" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4010
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4011
    // Use vxorpd since AVX does not have vpxor for 256-bit (AVX2 will have it).
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4012
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4013
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4014
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4015
  ins_pipe( fpu_reg_reg );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4016
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4017
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4018
// Replicate integer (4 byte) scalar to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4019
instruct Repl2I(vecD dst, rRegI src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4020
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4021
  match(Set dst (ReplicateI src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4022
  format %{ "movd    $dst,$src\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4023
            "pshufd  $dst,$dst,0x00\t! replicate2I" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4024
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4025
    __ movdl($dst$$XMMRegister, $src$$Register);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4026
    __ pshufd($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4027
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4028
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4029
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4030
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4031
// Integer could be loaded into xmm register directly from memory.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4032
instruct Repl2I_mem(vecD dst, memory mem) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4033
  predicate(n->as_Vector()->length() == 2);
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  4034
  match(Set dst (ReplicateI (LoadI mem)));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4035
  format %{ "movd    $dst,$mem\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4036
            "pshufd  $dst,$dst,0x00\t! replicate2I" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4037
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4038
    __ movdl($dst$$XMMRegister, $mem$$Address);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4039
    __ pshufd($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4040
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4041
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4042
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4043
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4044
// Replicate integer (4 byte) scalar immediate to be vector by loading from const table.
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4045
instruct Repl2I_imm(vecD dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4046
  predicate(n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4047
  match(Set dst (ReplicateI con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4048
  format %{ "movq    $dst,[$constantaddress]\t! replicate2I($con)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4049
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4050
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4051
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4052
  ins_pipe( fpu_reg_reg );
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4053
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4054
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4055
// Replicate integer (4 byte) scalar zero to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4056
instruct Repl2I_zero(vecD dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4057
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4058
  match(Set dst (ReplicateI zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4059
  format %{ "pxor    $dst,$dst\t! replicate2I" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4060
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4061
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4062
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4063
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4064
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4065
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4066
instruct Repl4I_zero(vecX dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4067
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4068
  match(Set dst (ReplicateI zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4069
  format %{ "pxor    $dst,$dst\t! replicate4I zero)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4070
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4071
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4072
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4073
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4074
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4075
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4076
instruct Repl8I_zero(vecY dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4077
  predicate(n->as_Vector()->length() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4078
  match(Set dst (ReplicateI zero));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  4079
  format %{ "vpxor   $dst,$dst,$dst\t! replicate8I zero" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4080
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4081
    // Use vxorpd since AVX does not have vpxor for 256-bit (AVX2 will have it).
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4082
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4083
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4084
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4085
  ins_pipe( fpu_reg_reg );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4086
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4087
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4088
// Replicate long (8 byte) scalar to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4089
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4090
instruct Repl2L(vecX dst, rRegL src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4091
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4092
  match(Set dst (ReplicateL src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4093
  format %{ "movdq   $dst,$src\n\t"
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  4094
            "punpcklqdq $dst,$dst\t! replicate2L" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4095
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4096
    __ movdq($dst$$XMMRegister, $src$$Register);
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  4097
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4098
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4099
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4100
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4101
#else // _LP64
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4102
instruct Repl2L(vecX dst, eRegL src, vecX tmp) %{
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4103
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4104
  match(Set dst (ReplicateL src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4105
  effect(TEMP dst, USE src, TEMP tmp);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4106
  format %{ "movdl   $dst,$src.lo\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4107
            "movdl   $tmp,$src.hi\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4108
            "punpckldq $dst,$tmp\n\t"
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  4109
            "punpcklqdq $dst,$dst\t! replicate2L"%}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4110
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4111
    __ movdl($dst$$XMMRegister, $src$$Register);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4112
    __ movdl($tmp$$XMMRegister, HIGH_FROM_LOW($src$$Register));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4113
    __ punpckldq($dst$$XMMRegister, $tmp$$XMMRegister);
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  4114
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4115
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4116
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4117
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4118
#endif // _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4119
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4120
// Replicate long (8 byte) scalar immediate to be vector by loading from const table.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4121
instruct Repl2L_imm(vecX dst, immL con) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4122
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4123
  match(Set dst (ReplicateL con));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  4124
  format %{ "movq    $dst,[$constantaddress]\n\t"
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  4125
            "punpcklqdq $dst,$dst\t! replicate2L($con)" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4126
  ins_encode %{
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  4127
    __ movq($dst$$XMMRegister, $constantaddress($con));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  4128
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4129
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4130
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4131
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4132
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4133
// Replicate long (8 byte) scalar zero to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4134
instruct Repl2L_zero(vecX dst, immL0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4135
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4136
  match(Set dst (ReplicateL zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4137
  format %{ "pxor    $dst,$dst\t! replicate2L zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4138
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4139
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4140
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4141
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4142
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4143
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4144
instruct Repl4L_zero(vecY dst, immL0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4145
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4146
  match(Set dst (ReplicateL zero));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  4147
  format %{ "vpxor   $dst,$dst,$dst\t! replicate4L zero" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4148
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4149
    // Use vxorpd since AVX does not have vpxor for 256-bit (AVX2 will have it).
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4150
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4151
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4152
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4153
  ins_pipe( fpu_reg_reg );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4154
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4155
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4156
// Replicate float (4 byte) scalar to be vector
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4157
instruct Repl2F(vecD dst, vlRegF src) %{
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4158
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4159
  match(Set dst (ReplicateF src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4160
  format %{ "pshufd  $dst,$dst,0x00\t! replicate2F" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4161
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4162
    __ pshufd($dst$$XMMRegister, $src$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4163
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4164
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4165
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4166
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4167
instruct Repl4F(vecX dst, vlRegF src) %{
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4168
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4169
  match(Set dst (ReplicateF src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4170
  format %{ "pshufd  $dst,$dst,0x00\t! replicate4F" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4171
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4172
    __ pshufd($dst$$XMMRegister, $src$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4173
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4174
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4175
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4176
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4177
// Replicate double (8 bytes) scalar to be vector
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4178
instruct Repl2D(vecX dst, vlRegD src) %{
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4179
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4180
  match(Set dst (ReplicateD src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4181
  format %{ "pshufd  $dst,$src,0x44\t! replicate2D" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4182
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4183
    __ pshufd($dst$$XMMRegister, $src$$XMMRegister, 0x44);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4184
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4185
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4186
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4187
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4188
// ====================EVEX REPLICATE=============================================
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4189
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4190
instruct Repl4B_mem_evex(vecS dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4191
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4192
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4193
  format %{ "vpbroadcastb  $dst,$mem\t! replicate4B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4194
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4195
    int vector_len = 0;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4196
    __ vpbroadcastb($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4197
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4198
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4199
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4200
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4201
instruct Repl8B_mem_evex(vecD dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4202
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4203
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4204
  format %{ "vpbroadcastb  $dst,$mem\t! replicate8B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4205
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4206
    int vector_len = 0;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4207
    __ vpbroadcastb($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4208
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4209
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4210
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4211
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4212
instruct Repl16B_evex(vecX dst, rRegI src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4213
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4214
  match(Set dst (ReplicateB src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4215
  format %{ "evpbroadcastb $dst,$src\t! replicate16B" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4216
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4217
   int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4218
    __ evpbroadcastb($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4219
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4220
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4221
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4222
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4223
instruct Repl16B_mem_evex(vecX dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4224
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4225
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4226
  format %{ "vpbroadcastb  $dst,$mem\t! replicate16B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4227
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4228
    int vector_len = 0;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4229
    __ vpbroadcastb($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4230
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4231
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4232
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4233
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4234
instruct Repl32B_evex(vecY dst, rRegI src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4235
  predicate(n->as_Vector()->length() == 32 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4236
  match(Set dst (ReplicateB src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4237
  format %{ "evpbroadcastb $dst,$src\t! replicate32B" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4238
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4239
   int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4240
    __ evpbroadcastb($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4241
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4242
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4243
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4244
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4245
instruct Repl32B_mem_evex(vecY dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4246
  predicate(n->as_Vector()->length() == 32 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4247
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4248
  format %{ "vpbroadcastb  $dst,$mem\t! replicate32B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4249
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4250
    int vector_len = 1;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4251
    __ vpbroadcastb($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4252
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4253
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4254
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4255
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4256
instruct Repl64B_evex(vecZ dst, rRegI src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4257
  predicate(n->as_Vector()->length() == 64 && UseAVX > 2 && VM_Version::supports_avx512bw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4258
  match(Set dst (ReplicateB src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4259
  format %{ "evpbroadcastb $dst,$src\t! upper replicate64B" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4260
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4261
   int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4262
    __ evpbroadcastb($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4263
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4264
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4265
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4266
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4267
instruct Repl64B_mem_evex(vecZ dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4268
  predicate(n->as_Vector()->length() == 64 && UseAVX > 2 && VM_Version::supports_avx512bw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4269
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4270
  format %{ "vpbroadcastb  $dst,$mem\t! replicate64B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4271
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4272
    int vector_len = 2;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4273
    __ vpbroadcastb($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4274
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4275
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4276
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4277
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4278
instruct Repl16B_imm_evex(vecX dst, immI con) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4279
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4280
  match(Set dst (ReplicateB con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4281
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4282
            "vpbroadcastb $dst,$dst\t! replicate16B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4283
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4284
   int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4285
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4286
    __ vpbroadcastb($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4287
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4288
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4289
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4290
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4291
instruct Repl32B_imm_evex(vecY dst, immI con) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4292
  predicate(n->as_Vector()->length() == 32 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4293
  match(Set dst (ReplicateB con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4294
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4295
            "vpbroadcastb $dst,$dst\t! replicate32B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4296
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4297
   int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4298
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4299
    __ vpbroadcastb($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4300
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4301
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4302
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4303
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4304
instruct Repl64B_imm_evex(vecZ dst, immI con) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4305
  predicate(n->as_Vector()->length() == 64 && UseAVX > 2 && VM_Version::supports_avx512bw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4306
  match(Set dst (ReplicateB con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4307
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4308
            "vpbroadcastb $dst,$dst\t! upper replicate64B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4309
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4310
   int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4311
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4312
    __ vpbroadcastb($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4313
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4314
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4315
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4316
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4317
instruct Repl64B_zero_evex(vecZ dst, immI0 zero) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4318
  predicate(n->as_Vector()->length() == 64 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4319
  match(Set dst (ReplicateB zero));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4320
  format %{ "vpxor   $dst k0,$dst,$dst\t! replicate64B zero" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4321
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4322
    // Use vxorpd since AVX does not have vpxor for 512-bit (EVEX will have it).
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4323
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4324
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4325
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4326
  ins_pipe( fpu_reg_reg );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4327
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4328
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4329
instruct Repl4S_evex(vecD dst, rRegI src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4330
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4331
  match(Set dst (ReplicateS src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4332
  format %{ "evpbroadcastw $dst,$src\t! replicate4S" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4333
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4334
   int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4335
    __ evpbroadcastw($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4336
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4337
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4338
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4339
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4340
instruct Repl4S_mem_evex(vecD dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4341
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4342
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4343
  format %{ "vpbroadcastw  $dst,$mem\t! replicate4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4344
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4345
    int vector_len = 0;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4346
    __ vpbroadcastw($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4347
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4348
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4349
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4350
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4351
instruct Repl8S_evex(vecX dst, rRegI src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4352
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4353
  match(Set dst (ReplicateS src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4354
  format %{ "evpbroadcastw $dst,$src\t! replicate8S" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4355
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4356
   int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4357
    __ evpbroadcastw($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4358
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4359
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4360
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4361
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4362
instruct Repl8S_mem_evex(vecX dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4363
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4364
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4365
  format %{ "vpbroadcastw  $dst,$mem\t! replicate8S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4366
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4367
    int vector_len = 0;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4368
    __ vpbroadcastw($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4369
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4370
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4371
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4372
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4373
instruct Repl16S_evex(vecY dst, rRegI src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4374
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4375
  match(Set dst (ReplicateS src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4376
  format %{ "evpbroadcastw $dst,$src\t! replicate16S" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4377
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4378
   int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4379
    __ evpbroadcastw($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4380
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4381
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4382
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4383
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4384
instruct Repl16S_mem_evex(vecY dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4385
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4386
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4387
  format %{ "vpbroadcastw  $dst,$mem\t! replicate16S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4388
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4389
    int vector_len = 1;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4390
    __ vpbroadcastw($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4391
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4392
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4393
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4394
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4395
instruct Repl32S_evex(vecZ dst, rRegI src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4396
  predicate(n->as_Vector()->length() == 32 && UseAVX > 2 && VM_Version::supports_avx512bw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4397
  match(Set dst (ReplicateS src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4398
  format %{ "evpbroadcastw $dst,$src\t! replicate32S" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4399
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4400
   int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4401
    __ evpbroadcastw($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4402
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4403
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4404
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4405
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4406
instruct Repl32S_mem_evex(vecZ dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4407
  predicate(n->as_Vector()->length() == 32 && UseAVX > 2 && VM_Version::supports_avx512bw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4408
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4409
  format %{ "vpbroadcastw  $dst,$mem\t! replicate32S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4410
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4411
    int vector_len = 2;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4412
    __ vpbroadcastw($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4413
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4414
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4415
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4416
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4417
instruct Repl8S_imm_evex(vecX dst, immI con) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4418
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4419
  match(Set dst (ReplicateS con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4420
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4421
            "vpbroadcastw $dst,$dst\t! replicate8S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4422
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4423
   int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4424
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4425
    __ vpbroadcastw($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4426
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4427
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4428
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4429
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4430
instruct Repl16S_imm_evex(vecY dst, immI con) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4431
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2 && VM_Version::supports_avx512vlbw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4432
  match(Set dst (ReplicateS con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4433
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4434
            "vpbroadcastw $dst,$dst\t! replicate16S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4435
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4436
   int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4437
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4438
    __ vpbroadcastw($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4439
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4440
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4441
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4442
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4443
instruct Repl32S_imm_evex(vecZ dst, immI con) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4444
  predicate(n->as_Vector()->length() == 32 && UseAVX > 2 && VM_Version::supports_avx512bw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4445
  match(Set dst (ReplicateS con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4446
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4447
            "vpbroadcastw $dst,$dst\t! replicate32S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4448
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4449
   int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4450
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4451
    __ vpbroadcastw($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4452
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4453
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4454
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4455
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4456
instruct Repl32S_zero_evex(vecZ dst, immI0 zero) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4457
  predicate(n->as_Vector()->length() == 32 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4458
  match(Set dst (ReplicateS zero));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4459
  format %{ "vpxor   $dst k0,$dst,$dst\t! replicate32S zero" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4460
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4461
    // Use vxorpd since AVX does not have vpxor for 512-bit (EVEX will have it).
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4462
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4463
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4464
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4465
  ins_pipe( fpu_reg_reg );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4466
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4467
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4468
instruct Repl4I_evex(vecX dst, rRegI src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4469
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4470
  match(Set dst (ReplicateI src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4471
  format %{ "evpbroadcastd  $dst,$src\t! replicate4I" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4472
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4473
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4474
    __ evpbroadcastd($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4475
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4476
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4477
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4478
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4479
instruct Repl4I_mem_evex(vecX dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4480
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4481
  match(Set dst (ReplicateI (LoadI mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4482
  format %{ "vpbroadcastd  $dst,$mem\t! replicate4I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4483
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4484
    int vector_len = 0;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4485
    __ vpbroadcastd($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4486
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4487
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4488
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4489
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4490
instruct Repl8I_evex(vecY dst, rRegI src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4491
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4492
  match(Set dst (ReplicateI src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4493
  format %{ "evpbroadcastd  $dst,$src\t! replicate8I" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4494
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4495
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4496
    __ evpbroadcastd($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4497
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4498
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4499
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4500
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4501
instruct Repl8I_mem_evex(vecY dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4502
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4503
  match(Set dst (ReplicateI (LoadI mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4504
  format %{ "vpbroadcastd  $dst,$mem\t! replicate8I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4505
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4506
    int vector_len = 1;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4507
    __ vpbroadcastd($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4508
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4509
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4510
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4511
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4512
instruct Repl16I_evex(vecZ dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4513
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4514
  match(Set dst (ReplicateI src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4515
  format %{ "evpbroadcastd  $dst,$src\t! replicate16I" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4516
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4517
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4518
    __ evpbroadcastd($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4519
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4520
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4521
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4522
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4523
instruct Repl16I_mem_evex(vecZ dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4524
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4525
  match(Set dst (ReplicateI (LoadI mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4526
  format %{ "vpbroadcastd  $dst,$mem\t! replicate16I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4527
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4528
    int vector_len = 2;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4529
    __ vpbroadcastd($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4530
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4531
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4532
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4533
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4534
instruct Repl4I_imm_evex(vecX dst, immI con) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4535
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4536
  match(Set dst (ReplicateI con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4537
  format %{ "movq    $dst,[$constantaddress]\t! replicate8I($con)\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4538
            "vpbroadcastd  $dst,$dst\t! replicate4I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4539
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4540
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4541
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4542
    __ vpbroadcastd($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4543
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4544
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4545
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4546
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4547
instruct Repl8I_imm_evex(vecY dst, immI con) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4548
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4549
  match(Set dst (ReplicateI con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4550
  format %{ "movq    $dst,[$constantaddress]\t! replicate8I($con)\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4551
            "vpbroadcastd  $dst,$dst\t! replicate8I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4552
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4553
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4554
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4555
    __ vpbroadcastd($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4556
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4557
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4558
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4559
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4560
instruct Repl16I_imm_evex(vecZ dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4561
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4562
  match(Set dst (ReplicateI con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4563
  format %{ "movq    $dst,[$constantaddress]\t! replicate16I($con)\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4564
            "vpbroadcastd  $dst,$dst\t! replicate16I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4565
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4566
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4567
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4568
    __ vpbroadcastd($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4569
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4570
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4571
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4572
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4573
instruct Repl16I_zero_evex(vecZ dst, immI0 zero) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4574
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4575
  match(Set dst (ReplicateI zero));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4576
  format %{ "vpxor   $dst k0,$dst,$dst\t! replicate16I zero" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4577
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4578
    // Use vxorpd since AVX does not have vpxor for 512-bit (AVX2 will have it).
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4579
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4580
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4581
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4582
  ins_pipe( fpu_reg_reg );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4583
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4584
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4585
// Replicate long (8 byte) scalar to be vector
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4586
#ifdef _LP64
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4587
instruct Repl4L_evex(vecY dst, rRegL src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4588
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4589
  match(Set dst (ReplicateL src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4590
  format %{ "evpbroadcastq  $dst,$src\t! replicate4L" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4591
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4592
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4593
    __ evpbroadcastq($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4594
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4595
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4596
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4597
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4598
instruct Repl8L_evex(vecZ dst, rRegL src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4599
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4600
  match(Set dst (ReplicateL src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4601
  format %{ "evpbroadcastq  $dst,$src\t! replicate8L" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4602
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4603
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4604
    __ evpbroadcastq($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4605
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4606
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4607
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4608
#else // _LP64
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4609
instruct Repl4L_evex(vecY dst, eRegL src, regD tmp) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4610
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4611
  match(Set dst (ReplicateL src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4612
  effect(TEMP dst, USE src, TEMP tmp);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4613
  format %{ "movdl   $dst,$src.lo\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4614
            "movdl   $tmp,$src.hi\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4615
            "punpckldq $dst,$tmp\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4616
            "vpbroadcastq  $dst,$dst\t! replicate4L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4617
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4618
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4619
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4620
    __ movdl($tmp$$XMMRegister, HIGH_FROM_LOW($src$$Register));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4621
    __ punpckldq($dst$$XMMRegister, $tmp$$XMMRegister);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4622
    __ vpbroadcastq($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4623
  %}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4624
  ins_pipe( pipe_slow );
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4625
%}
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4626
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4627
instruct Repl8L_evex(legVecZ dst, eRegL src, legVecZ tmp) %{
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4628
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4629
  match(Set dst (ReplicateL src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4630
  effect(TEMP dst, USE src, TEMP tmp);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4631
  format %{ "movdl   $dst,$src.lo\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4632
            "movdl   $tmp,$src.hi\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4633
            "punpckldq $dst,$tmp\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4634
            "vpbroadcastq  $dst,$dst\t! replicate8L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4635
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4636
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4637
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4638
    __ movdl($tmp$$XMMRegister, HIGH_FROM_LOW($src$$Register));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4639
    __ punpckldq($dst$$XMMRegister, $tmp$$XMMRegister);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4640
    __ vpbroadcastq($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4641
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4642
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4643
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4644
#endif // _LP64
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4645
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4646
instruct Repl4L_imm_evex(vecY dst, immL con) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4647
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4648
  match(Set dst (ReplicateL con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4649
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4650
            "vpbroadcastq  $dst,$dst\t! replicate4L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4651
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4652
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4653
    __ movq($dst$$XMMRegister, $constantaddress($con));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4654
    __ vpbroadcastq($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4655
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4656
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4657
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4658
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4659
instruct Repl8L_imm_evex(vecZ dst, immL con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4660
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4661
  match(Set dst (ReplicateL con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4662
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4663
            "vpbroadcastq  $dst,$dst\t! replicate8L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4664
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4665
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4666
    __ movq($dst$$XMMRegister, $constantaddress($con));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4667
    __ vpbroadcastq($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4668
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4669
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4670
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4671
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4672
instruct Repl2L_mem_evex(vecX dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4673
  predicate(n->as_Vector()->length() == 2 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4674
  match(Set dst (ReplicateL (LoadL mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4675
  format %{ "vpbroadcastd  $dst,$mem\t! replicate2L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4676
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4677
    int vector_len = 0;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4678
    __ vpbroadcastq($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4679
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4680
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4681
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4682
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4683
instruct Repl4L_mem_evex(vecY dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4684
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4685
  match(Set dst (ReplicateL (LoadL mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4686
  format %{ "vpbroadcastd  $dst,$mem\t! replicate4L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4687
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4688
    int vector_len = 1;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4689
    __ vpbroadcastq($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4690
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4691
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4692
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4693
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4694
instruct Repl8L_mem_evex(vecZ dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4695
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4696
  match(Set dst (ReplicateL (LoadL mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4697
  format %{ "vpbroadcastd  $dst,$mem\t! replicate8L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4698
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4699
    int vector_len = 2;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4700
    __ vpbroadcastq($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4701
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4702
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4703
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4704
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4705
instruct Repl8L_zero_evex(vecZ dst, immL0 zero) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4706
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4707
  match(Set dst (ReplicateL zero));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4708
  format %{ "vpxor   $dst k0,$dst,$dst\t! replicate8L zero" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4709
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4710
    // Use vxorpd since AVX does not have vpxor for 512-bit (EVEX will have it).
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4711
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4712
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4713
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4714
  ins_pipe( fpu_reg_reg );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4715
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4716
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4717
instruct Repl8F_evex(vecY dst, regF src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4718
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4719
  match(Set dst (ReplicateF src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4720
  format %{ "vpbroadcastss $dst,$src\t! replicate8F" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4721
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4722
    int vector_len = 1;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4723
    __ vpbroadcastss($dst$$XMMRegister, $src$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4724
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4725
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4726
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4727
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4728
instruct Repl8F_mem_evex(vecY dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4729
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4730
  match(Set dst (ReplicateF (LoadF mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4731
  format %{ "vbroadcastss  $dst,$mem\t! replicate8F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4732
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4733
    int vector_len = 1;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4734
    __ vpbroadcastss($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4735
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4736
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4737
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4738
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4739
instruct Repl16F_evex(vecZ dst, regF src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4740
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4741
  match(Set dst (ReplicateF src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4742
  format %{ "vpbroadcastss $dst,$src\t! replicate16F" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4743
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4744
    int vector_len = 2;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4745
    __ vpbroadcastss($dst$$XMMRegister, $src$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4746
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4747
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4748
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4749
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4750
instruct Repl16F_mem_evex(vecZ dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4751
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4752
  match(Set dst (ReplicateF (LoadF mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4753
  format %{ "vbroadcastss  $dst,$mem\t! replicate16F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4754
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4755
    int vector_len = 2;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4756
    __ vpbroadcastss($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4757
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4758
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4759
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4760
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4761
instruct Repl16F_zero_evex(vecZ dst, immF0 zero) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4762
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4763
  match(Set dst (ReplicateF zero));
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4764
  format %{ "vpxor  $dst k0,$dst,$dst\t! replicate16F zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4765
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4766
    // Use vpxor in place of vxorps since EVEX has a constriant on dq for vxorps: this is a 512-bit operation
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4767
    int vector_len = 2;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4768
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4769
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4770
  ins_pipe( fpu_reg_reg );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4771
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4772
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4773
instruct Repl4D_evex(vecY dst, regD src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4774
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4775
  match(Set dst (ReplicateD src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4776
  format %{ "vpbroadcastsd $dst,$src\t! replicate4D" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4777
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4778
    int vector_len = 1;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4779
    __ vpbroadcastsd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4780
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4781
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4782
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4783
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4784
instruct Repl4D_mem_evex(vecY dst, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4785
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2 && VM_Version::supports_avx512vl());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4786
  match(Set dst (ReplicateD (LoadD mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4787
  format %{ "vbroadcastsd  $dst,$mem\t! replicate4D" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4788
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4789
    int vector_len = 1;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4790
    __ vpbroadcastsd($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4791
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4792
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4793
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4794
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4795
instruct Repl8D_evex(vecZ dst, regD src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4796
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4797
  match(Set dst (ReplicateD src));
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4798
  format %{ "vpbroadcastsd $dst,$src\t! replicate8D" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4799
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4800
    int vector_len = 2;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4801
    __ vpbroadcastsd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4802
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4803
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4804
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4805
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4806
instruct Repl8D_mem_evex(vecZ dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4807
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4808
  match(Set dst (ReplicateD (LoadD mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4809
  format %{ "vbroadcastsd  $dst,$mem\t! replicate8D" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4810
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4811
    int vector_len = 2;
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4812
    __ vpbroadcastsd($dst$$XMMRegister, $mem$$Address, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4813
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4814
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4815
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4816
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4817
instruct Repl8D_zero_evex(vecZ dst, immD0 zero) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4818
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4819
  match(Set dst (ReplicateD zero));
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4820
  format %{ "vpxor  $dst k0,$dst,$dst,vect512\t! replicate8D zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4821
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4822
    // Use vpxor in place of vxorpd since EVEX has a constriant on dq for vxorpd: this is a 512-bit operation
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4823
    int vector_len = 2;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4824
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4825
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4826
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4827
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4828
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4829
// ====================REDUCTION ARITHMETIC=======================================
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4830
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4831
instruct rsadd2I_reduction_reg(rRegI dst, rRegI src1, vecD src2, vecD tmp, vecD tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4832
  predicate(UseSSE > 2 && UseAVX == 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4833
  match(Set dst (AddReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4834
  effect(TEMP tmp2, TEMP tmp);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4835
  format %{ "movdqu  $tmp2,$src2\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4836
            "phaddd  $tmp2,$tmp2\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4837
            "movd    $tmp,$src1\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4838
            "paddd   $tmp,$tmp2\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4839
            "movd    $dst,$tmp\t! add reduction2I" %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4840
  ins_encode %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4841
    __ movdqu($tmp2$$XMMRegister, $src2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4842
    __ phaddd($tmp2$$XMMRegister, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4843
    __ movdl($tmp$$XMMRegister, $src1$$Register);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4844
    __ paddd($tmp$$XMMRegister, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4845
    __ movdl($dst$$Register, $tmp$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4846
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4847
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4848
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4849
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4850
instruct rvadd2I_reduction_reg(rRegI dst, rRegI src1, vecD src2, vecD tmp, vecD tmp2) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4851
  predicate(VM_Version::supports_avxonly());
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4852
  match(Set dst (AddReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4853
  effect(TEMP tmp, TEMP tmp2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4854
  format %{ "vphaddd  $tmp,$src2,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4855
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4856
            "vpaddd   $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4857
            "movd     $dst,$tmp2\t! add reduction2I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4858
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4859
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4860
    __ vphaddd($tmp$$XMMRegister, $src2$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4861
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4862
    __ vpaddd($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4863
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4864
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4865
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4866
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4867
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4868
instruct rvadd2I_reduction_reg_evex(rRegI dst, rRegI src1, vecD src2, vecD tmp, vecD tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4869
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4870
  match(Set dst (AddReductionVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4871
  effect(TEMP tmp, TEMP tmp2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4872
  format %{ "pshufd  $tmp2,$src2,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4873
            "vpaddd  $tmp,$src2,$tmp2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4874
            "movd    $tmp2,$src1\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4875
            "vpaddd  $tmp2,$tmp,$tmp2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4876
            "movd    $dst,$tmp2\t! add reduction2I" %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4877
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4878
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4879
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4880
    __ vpaddd($tmp$$XMMRegister, $src2$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4881
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4882
    __ vpaddd($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4883
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4884
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4885
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4886
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4887
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4888
instruct rsadd4I_reduction_reg(rRegI dst, rRegI src1, vecX src2, vecX tmp, vecX tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4889
  predicate(UseSSE > 2 && UseAVX == 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4890
  match(Set dst (AddReductionVI src1 src2));
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4891
  effect(TEMP tmp, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4892
  format %{ "movdqu  $tmp,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4893
            "phaddd  $tmp,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4894
            "phaddd  $tmp,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4895
            "movd    $tmp2,$src1\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4896
            "paddd   $tmp2,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4897
            "movd    $dst,$tmp2\t! add reduction4I" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4898
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4899
    __ movdqu($tmp$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4900
    __ phaddd($tmp$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4901
    __ phaddd($tmp$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4902
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4903
    __ paddd($tmp2$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4904
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4905
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4906
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4907
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4908
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4909
instruct rvadd4I_reduction_reg(rRegI dst, rRegI src1, vecX src2, vecX tmp, vecX tmp2) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4910
  predicate(VM_Version::supports_avxonly());
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4911
  match(Set dst (AddReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4912
  effect(TEMP tmp, TEMP tmp2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4913
  format %{ "vphaddd  $tmp,$src2,$src2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4914
            "vphaddd  $tmp,$tmp,$tmp\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4915
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4916
            "vpaddd   $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4917
            "movd     $dst,$tmp2\t! add reduction4I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4918
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4919
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4920
    __ vphaddd($tmp$$XMMRegister, $src2$$XMMRegister, $src2$$XMMRegister, vector_len);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4921
    __ vphaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp$$XMMRegister, vector_len);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4922
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4923
    __ vpaddd($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4924
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4925
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4926
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4927
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4928
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4929
instruct rvadd4I_reduction_reg_evex(rRegI dst, rRegI src1, vecX src2, vecX tmp, vecX tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4930
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4931
  match(Set dst (AddReductionVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4932
  effect(TEMP tmp, TEMP tmp2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4933
  format %{ "pshufd  $tmp2,$src2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4934
            "vpaddd  $tmp,$src2,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4935
            "pshufd  $tmp2,$tmp,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4936
            "vpaddd  $tmp,$tmp,$tmp2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4937
            "movd    $tmp2,$src1\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4938
            "vpaddd  $tmp2,$tmp,$tmp2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4939
            "movd    $dst,$tmp2\t! add reduction4I" %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4940
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4941
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4942
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4943
    __ vpaddd($tmp$$XMMRegister, $src2$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4944
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0x1);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4945
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4946
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4947
    __ vpaddd($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4948
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4949
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4950
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4951
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4952
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4953
instruct rvadd8I_reduction_reg(rRegI dst, rRegI src1, vecY src2, vecY tmp, vecY tmp2) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4954
  predicate(VM_Version::supports_avxonly());
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4955
  match(Set dst (AddReductionVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4956
  effect(TEMP tmp, TEMP tmp2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4957
  format %{ "vphaddd  $tmp,$src2,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4958
            "vphaddd  $tmp,$tmp,$tmp2\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4959
            "vextracti128_high  $tmp2,$tmp\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4960
            "vpaddd   $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4961
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4962
            "vpaddd   $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4963
            "movd     $dst,$tmp2\t! add reduction8I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4964
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4965
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4966
    __ vphaddd($tmp$$XMMRegister, $src2$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4967
    __ vphaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4968
    __ vextracti128_high($tmp2$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4969
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4970
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4971
    __ vpaddd($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4972
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4973
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4974
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4975
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4976
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  4977
instruct rvadd8I_reduction_reg_evex(rRegI dst, rRegI src1, vecY src2, vecY tmp, vecY tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4978
  predicate(UseAVX > 2);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4979
  match(Set dst (AddReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4980
  effect(TEMP tmp, TEMP tmp2);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4981
  format %{ "vextracti128_high  $tmp,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4982
            "vpaddd  $tmp,$tmp,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4983
            "pshufd  $tmp2,$tmp,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4984
            "vpaddd  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4985
            "pshufd  $tmp2,$tmp,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4986
            "vpaddd  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4987
            "movd    $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4988
            "vpaddd  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4989
            "movd    $dst,$tmp2\t! add reduction8I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4990
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4991
    int vector_len = 0;
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4992
    __ vextracti128_high($tmp$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4993
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4994
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4995
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4996
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0x1);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4997
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4998
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4999
    __ vpaddd($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5000
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5001
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5002
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5003
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5004
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5005
instruct rvadd16I_reduction_reg_evex(rRegI dst, rRegI src1, legVecZ src2, legVecZ tmp, legVecZ tmp2, legVecZ tmp3) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5006
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5007
  match(Set dst (AddReductionVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5008
  effect(TEMP tmp, TEMP tmp2, TEMP tmp3);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5009
  format %{ "vextracti64x4_high  $tmp3,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5010
            "vpaddd  $tmp3,$tmp3,$src2\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5011
            "vextracti128_high  $tmp,$tmp3\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5012
            "vpaddd  $tmp,$tmp,$tmp3\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5013
            "pshufd  $tmp2,$tmp,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5014
            "vpaddd  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5015
            "pshufd  $tmp2,$tmp,0x1\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5016
            "vpaddd  $tmp,$tmp,$tmp2\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5017
            "movd    $tmp2,$src1\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5018
            "vpaddd  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5019
            "movd    $dst,$tmp2\t! mul reduction16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5020
  ins_encode %{
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5021
    __ vextracti64x4_high($tmp3$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5022
    __ vpaddd($tmp3$$XMMRegister, $tmp3$$XMMRegister, $src2$$XMMRegister, 1);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5023
    __ vextracti128_high($tmp$$XMMRegister, $tmp3$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5024
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp3$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5025
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5026
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5027
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0x1);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5028
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5029
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5030
    __ vpaddd($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5031
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5032
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5033
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5034
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5035
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5036
#ifdef _LP64
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5037
instruct rvadd2L_reduction_reg(rRegL dst, rRegL src1, vecX src2, vecX tmp, vecX tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5038
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5039
  match(Set dst (AddReductionVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5040
  effect(TEMP tmp, TEMP tmp2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5041
  format %{ "pshufd  $tmp2,$src2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5042
            "vpaddq  $tmp,$src2,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5043
            "movdq   $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5044
            "vpaddq  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5045
            "movdq   $dst,$tmp2\t! add reduction2L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5046
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5047
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5048
    __ vpaddq($tmp$$XMMRegister, $src2$$XMMRegister, $tmp2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5049
    __ movdq($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5050
    __ vpaddq($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5051
    __ movdq($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5052
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5053
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5054
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5055
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5056
instruct rvadd4L_reduction_reg(rRegL dst, rRegL src1, vecY src2, vecY tmp, vecY tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5057
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5058
  match(Set dst (AddReductionVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5059
  effect(TEMP tmp, TEMP tmp2);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5060
  format %{ "vextracti128_high  $tmp,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5061
            "vpaddq  $tmp2,$tmp,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5062
            "pshufd  $tmp,$tmp2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5063
            "vpaddq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5064
            "movdq   $tmp,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5065
            "vpaddq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5066
            "movdq   $dst,$tmp2\t! add reduction4L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5067
  ins_encode %{
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5068
    __ vextracti128_high($tmp$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5069
    __ vpaddq($tmp2$$XMMRegister, $tmp$$XMMRegister, $src2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5070
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5071
    __ vpaddq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5072
    __ movdq($tmp$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5073
    __ vpaddq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5074
    __ movdq($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5075
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5076
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5077
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5078
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5079
instruct rvadd8L_reduction_reg(rRegL dst, rRegL src1, legVecZ src2, legVecZ tmp, legVecZ tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5080
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5081
  match(Set dst (AddReductionVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5082
  effect(TEMP tmp, TEMP tmp2);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5083
  format %{ "vextracti64x4_high  $tmp2,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5084
            "vpaddq  $tmp2,$tmp2,$src2\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5085
            "vextracti128_high  $tmp,$tmp2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5086
            "vpaddq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5087
            "pshufd  $tmp,$tmp2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5088
            "vpaddq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5089
            "movdq   $tmp,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5090
            "vpaddq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5091
            "movdq   $dst,$tmp2\t! add reduction8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5092
  ins_encode %{
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5093
    __ vextracti64x4_high($tmp2$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5094
    __ vpaddq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $src2$$XMMRegister, 1);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5095
    __ vextracti128_high($tmp$$XMMRegister, $tmp2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5096
    __ vpaddq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5097
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5098
    __ vpaddq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5099
    __ movdq($tmp$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5100
    __ vpaddq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5101
    __ movdq($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5102
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5103
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5104
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5105
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5106
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5107
instruct rsadd2F_reduction_reg(regF dst, vecD src2, vecD tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5108
  predicate(UseSSE >= 1 && UseAVX == 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5109
  match(Set dst (AddReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5110
  effect(TEMP dst, TEMP tmp);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5111
  format %{ "addss   $dst,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5112
            "pshufd  $tmp,$src2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5113
            "addss   $dst,$tmp\t! add reduction2F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5114
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5115
    __ addss($dst$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5116
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5117
    __ addss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5118
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5119
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5120
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5121
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5122
instruct rvadd2F_reduction_reg(regF dst, vecD src2, vecD tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5123
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5124
  match(Set dst (AddReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5125
  effect(TEMP dst, TEMP tmp);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5126
  format %{ "vaddss  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5127
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5128
            "vaddss  $dst,$dst,$tmp\t! add reduction2F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5129
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5130
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5131
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5132
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5133
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5134
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5135
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5136
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5137
instruct rsadd4F_reduction_reg(regF dst, vecX src2, vecX tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5138
  predicate(UseSSE >= 1 && UseAVX == 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5139
  match(Set dst (AddReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5140
  effect(TEMP dst, TEMP tmp);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5141
  format %{ "addss   $dst,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5142
            "pshufd  $tmp,$src2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5143
            "addss   $dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5144
            "pshufd  $tmp,$src2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5145
            "addss   $dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5146
            "pshufd  $tmp,$src2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5147
            "addss   $dst,$tmp\t! add reduction4F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5148
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5149
    __ addss($dst$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5150
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5151
    __ addss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5152
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5153
    __ addss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5154
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5155
    __ addss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5156
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5157
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5158
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5159
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5160
instruct rvadd4F_reduction_reg(regF dst, vecX src2, vecX tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5161
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5162
  match(Set dst (AddReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5163
  effect(TEMP tmp, TEMP dst);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5164
  format %{ "vaddss  $dst,dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5165
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5166
            "vaddss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5167
            "pshufd  $tmp,$src2,0x02\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5168
            "vaddss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5169
            "pshufd  $tmp,$src2,0x03\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5170
            "vaddss  $dst,$dst,$tmp\t! add reduction4F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5171
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5172
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5173
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5174
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5175
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5176
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5177
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5178
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5179
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5180
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5181
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5182
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5183
instruct radd8F_reduction_reg(regF dst, vecY src2, vecY tmp, vecY tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5184
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5185
  match(Set dst (AddReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5186
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5187
  format %{ "vaddss  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5188
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5189
            "vaddss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5190
            "pshufd  $tmp,$src2,0x02\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5191
            "vaddss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5192
            "pshufd  $tmp,$src2,0x03\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5193
            "vaddss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5194
            "vextractf128_high  $tmp2,$src2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5195
            "vaddss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5196
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5197
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5198
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5199
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5200
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5201
            "vaddss  $dst,$dst,$tmp\t! add reduction8F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5202
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5203
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5204
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5205
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5206
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5207
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5208
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5209
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5210
    __ vextractf128_high($tmp2$$XMMRegister, $src2$$XMMRegister);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5211
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5212
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5213
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5214
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5215
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5216
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5217
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5218
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5219
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5220
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5221
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5222
instruct radd16F_reduction_reg(regF dst, legVecZ src2, legVecZ tmp, legVecZ tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5223
  predicate(UseAVX > 2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5224
  match(Set dst (AddReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5225
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5226
  format %{ "vaddss  $dst,$dst,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5227
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5228
            "vaddss  $dst,$dst,$tmp\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5229
            "pshufd  $tmp,$src2,0x02\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5230
            "vaddss  $dst,$dst,$tmp\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5231
            "pshufd  $tmp,$src2,0x03\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5232
            "vaddss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5233
            "vextractf32x4  $tmp2,$src2,0x1\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5234
            "vaddss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5235
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5236
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5237
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5238
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5239
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5240
            "vaddss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5241
            "vextractf32x4  $tmp2,$src2,0x2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5242
            "vaddss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5243
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5244
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5245
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5246
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5247
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5248
            "vaddss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5249
            "vextractf32x4  $tmp2,$src2,0x3\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5250
            "vaddss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5251
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5252
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5253
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5254
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5255
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5256
            "vaddss  $dst,$dst,$tmp\t! add reduction16F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5257
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5258
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5259
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5260
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5261
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5262
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5263
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5264
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5265
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5266
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5267
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5268
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5269
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5270
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5271
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5272
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5273
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5274
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5275
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5276
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5277
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5278
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5279
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5280
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5281
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x3);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5282
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5283
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5284
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5285
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5286
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5287
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5288
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5289
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5290
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5291
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5292
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5293
instruct rsadd2D_reduction_reg(regD dst, vecX src2, vecX tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5294
  predicate(UseSSE >= 1 && UseAVX == 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5295
  match(Set dst (AddReductionVD dst src2));
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5296
  effect(TEMP tmp, TEMP dst);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5297
  format %{ "addsd   $dst,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5298
            "pshufd  $tmp,$src2,0xE\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5299
            "addsd   $dst,$tmp\t! add reduction2D" %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5300
  ins_encode %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5301
    __ addsd($dst$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5302
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5303
    __ addsd($dst$$XMMRegister, $tmp$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5304
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5305
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5306
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5307
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5308
instruct rvadd2D_reduction_reg(regD dst, vecX src2, vecX tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5309
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5310
  match(Set dst (AddReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5311
  effect(TEMP tmp, TEMP dst);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5312
  format %{ "vaddsd  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5313
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5314
            "vaddsd  $dst,$dst,$tmp\t! add reduction2D" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5315
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5316
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5317
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5318
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5319
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5320
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5321
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5322
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5323
instruct rvadd4D_reduction_reg(regD dst, vecY src2, vecX tmp, vecX tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5324
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5325
  match(Set dst (AddReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5326
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5327
  format %{ "vaddsd  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5328
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5329
            "vaddsd  $dst,$dst,$tmp\n\t"
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5330
            "vextractf128  $tmp2,$src2,0x1\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5331
            "vaddsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5332
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5333
            "vaddsd  $dst,$dst,$tmp\t! add reduction4D" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5334
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5335
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5336
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5337
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5338
    __ vextractf128($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5339
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5340
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5341
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5342
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5343
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5344
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5345
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5346
instruct rvadd8D_reduction_reg(regD dst, legVecZ src2, legVecZ tmp, legVecZ tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5347
  predicate(UseAVX > 2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5348
  match(Set dst (AddReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5349
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5350
  format %{ "vaddsd  $dst,$dst,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5351
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5352
            "vaddsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5353
            "vextractf32x4  $tmp2,$src2,0x1\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5354
            "vaddsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5355
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5356
            "vaddsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5357
            "vextractf32x4  $tmp2,$src2,0x2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5358
            "vaddsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5359
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5360
            "vaddsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5361
            "vextractf32x4  $tmp2,$src2,0x3\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5362
            "vaddsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5363
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5364
            "vaddsd  $dst,$dst,$tmp\t! add reduction8D" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5365
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5366
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5367
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5368
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5369
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5370
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5371
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5372
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5373
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5374
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5375
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5376
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5377
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x3);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5378
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5379
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5380
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5381
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5382
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5383
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5384
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5385
instruct rsmul2I_reduction_reg(rRegI dst, rRegI src1, vecD src2, vecD tmp, vecD tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5386
  predicate(UseSSE > 3 && UseAVX == 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5387
  match(Set dst (MulReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5388
  effect(TEMP tmp, TEMP tmp2);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5389
  format %{ "pshufd  $tmp2,$src2,0x1\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5390
            "pmulld  $tmp2,$src2\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5391
            "movd    $tmp,$src1\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5392
            "pmulld  $tmp2,$tmp\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5393
            "movd    $dst,$tmp2\t! mul reduction2I" %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5394
  ins_encode %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5395
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5396
    __ pmulld($tmp2$$XMMRegister, $src2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5397
    __ movdl($tmp$$XMMRegister, $src1$$Register);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5398
    __ pmulld($tmp2$$XMMRegister, $tmp$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5399
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5400
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5401
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5402
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5403
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5404
instruct rvmul2I_reduction_reg(rRegI dst, rRegI src1, vecD src2, vecD tmp, vecD tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5405
  predicate(UseAVX > 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5406
  match(Set dst (MulReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5407
  effect(TEMP tmp, TEMP tmp2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5408
  format %{ "pshufd   $tmp2,$src2,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5409
            "vpmulld  $tmp,$src2,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5410
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5411
            "vpmulld  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5412
            "movd     $dst,$tmp2\t! mul reduction2I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5413
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5414
    int vector_len = 0;
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5415
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5416
    __ vpmulld($tmp$$XMMRegister, $src2$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5417
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5418
    __ vpmulld($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5419
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5420
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5421
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5422
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5423
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5424
instruct rsmul4I_reduction_reg(rRegI dst, rRegI src1, vecX src2, vecX tmp, vecX tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5425
  predicate(UseSSE > 3 && UseAVX == 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5426
  match(Set dst (MulReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5427
  effect(TEMP tmp, TEMP tmp2);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5428
  format %{ "pshufd  $tmp2,$src2,0xE\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5429
            "pmulld  $tmp2,$src2\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5430
            "pshufd  $tmp,$tmp2,0x1\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5431
            "pmulld  $tmp2,$tmp\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5432
            "movd    $tmp,$src1\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5433
            "pmulld  $tmp2,$tmp\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5434
            "movd    $dst,$tmp2\t! mul reduction4I" %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5435
  ins_encode %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5436
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0xE);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5437
    __ pmulld($tmp2$$XMMRegister, $src2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5438
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x1);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5439
    __ pmulld($tmp2$$XMMRegister, $tmp$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5440
    __ movdl($tmp$$XMMRegister, $src1$$Register);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5441
    __ pmulld($tmp2$$XMMRegister, $tmp$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5442
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5443
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5444
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5445
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5446
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5447
instruct rvmul4I_reduction_reg(rRegI dst, rRegI src1, vecX src2, vecX tmp, vecX tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5448
  predicate(UseAVX > 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5449
  match(Set dst (MulReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5450
  effect(TEMP tmp, TEMP tmp2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5451
  format %{ "pshufd   $tmp2,$src2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5452
            "vpmulld  $tmp,$src2,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5453
            "pshufd   $tmp2,$tmp,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5454
            "vpmulld  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5455
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5456
            "vpmulld  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5457
            "movd     $dst,$tmp2\t! mul reduction4I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5458
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5459
    int vector_len = 0;
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5460
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0xE);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5461
    __ vpmulld($tmp$$XMMRegister, $src2$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5462
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0x1);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5463
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5464
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5465
    __ vpmulld($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5466
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5467
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5468
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5469
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5470
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5471
instruct rvmul8I_reduction_reg(rRegI dst, rRegI src1, vecY src2, vecY tmp, vecY tmp2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5472
  predicate(UseAVX > 1);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5473
  match(Set dst (MulReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5474
  effect(TEMP tmp, TEMP tmp2);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5475
  format %{ "vextracti128_high  $tmp,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5476
            "vpmulld  $tmp,$tmp,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5477
            "pshufd   $tmp2,$tmp,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5478
            "vpmulld  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5479
            "pshufd   $tmp2,$tmp,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5480
            "vpmulld  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5481
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5482
            "vpmulld  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5483
            "movd     $dst,$tmp2\t! mul reduction8I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5484
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5485
    int vector_len = 0;
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5486
    __ vextracti128_high($tmp$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5487
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5488
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5489
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5490
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0x1);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5491
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5492
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5493
    __ vpmulld($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5494
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5495
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5496
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5497
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5498
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5499
instruct rvmul16I_reduction_reg(rRegI dst, rRegI src1, legVecZ src2, legVecZ tmp, legVecZ tmp2, legVecZ tmp3) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5500
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5501
  match(Set dst (MulReductionVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5502
  effect(TEMP tmp, TEMP tmp2, TEMP tmp3);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5503
  format %{ "vextracti64x4_high  $tmp3,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5504
            "vpmulld  $tmp3,$tmp3,$src2\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5505
            "vextracti128_high  $tmp,$tmp3\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5506
            "vpmulld  $tmp,$tmp,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5507
            "pshufd   $tmp2,$tmp,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5508
            "vpmulld  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5509
            "pshufd   $tmp2,$tmp,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5510
            "vpmulld  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5511
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5512
            "vpmulld  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5513
            "movd     $dst,$tmp2\t! mul reduction16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5514
  ins_encode %{
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5515
    __ vextracti64x4_high($tmp3$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5516
    __ vpmulld($tmp3$$XMMRegister, $tmp3$$XMMRegister, $src2$$XMMRegister, 1);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5517
    __ vextracti128_high($tmp$$XMMRegister, $tmp3$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5518
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp3$$XMMRegister, 0);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5519
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0xE);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5520
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5521
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0x1);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5522
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5523
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5524
    __ vpmulld($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5525
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5526
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5527
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5528
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5529
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5530
#ifdef _LP64
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5531
instruct rvmul2L_reduction_reg(rRegL dst, rRegL src1, vecX src2, vecX tmp, vecX tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5532
  predicate(UseAVX > 2 && VM_Version::supports_avx512dq());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5533
  match(Set dst (MulReductionVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5534
  effect(TEMP tmp, TEMP tmp2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5535
  format %{ "pshufd   $tmp2,$src2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5536
            "vpmullq  $tmp,$src2,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5537
            "movdq    $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5538
            "vpmullq  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5539
            "movdq    $dst,$tmp2\t! mul reduction2L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5540
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5541
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5542
    __ vpmullq($tmp$$XMMRegister, $src2$$XMMRegister, $tmp2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5543
    __ movdq($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5544
    __ vpmullq($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5545
    __ movdq($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5546
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5547
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5548
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5549
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5550
instruct rvmul4L_reduction_reg(rRegL dst, rRegL src1, vecY src2, vecY tmp, vecY tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5551
  predicate(UseAVX > 2 && VM_Version::supports_avx512dq());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5552
  match(Set dst (MulReductionVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5553
  effect(TEMP tmp, TEMP tmp2);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5554
  format %{ "vextracti128_high  $tmp,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5555
            "vpmullq  $tmp2,$tmp,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5556
            "pshufd   $tmp,$tmp2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5557
            "vpmullq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5558
            "movdq    $tmp,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5559
            "vpmullq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5560
            "movdq    $dst,$tmp2\t! mul reduction4L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5561
  ins_encode %{
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5562
    __ vextracti128_high($tmp$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5563
    __ vpmullq($tmp2$$XMMRegister, $tmp$$XMMRegister, $src2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5564
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5565
    __ vpmullq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5566
    __ movdq($tmp$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5567
    __ vpmullq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5568
    __ movdq($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5569
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5570
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5571
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5572
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5573
instruct rvmul8L_reduction_reg(rRegL dst, rRegL src1, legVecZ src2, legVecZ tmp, legVecZ tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5574
  predicate(UseAVX > 2 && VM_Version::supports_avx512dq());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5575
  match(Set dst (MulReductionVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5576
  effect(TEMP tmp, TEMP tmp2);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5577
  format %{ "vextracti64x4_high  $tmp2,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5578
            "vpmullq  $tmp2,$tmp2,$src2\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5579
            "vextracti128_high  $tmp,$tmp2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5580
            "vpmullq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5581
            "pshufd   $tmp,$tmp2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5582
            "vpmullq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5583
            "movdq    $tmp,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5584
            "vpmullq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5585
            "movdq    $dst,$tmp2\t! mul reduction8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5586
  ins_encode %{
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5587
    __ vextracti64x4_high($tmp2$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5588
    __ vpmullq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $src2$$XMMRegister, 1);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5589
    __ vextracti128_high($tmp$$XMMRegister, $tmp2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5590
    __ vpmullq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5591
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5592
    __ vpmullq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5593
    __ movdq($tmp$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5594
    __ vpmullq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5595
    __ movdq($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5596
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5597
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5598
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5599
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5600
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5601
instruct rsmul2F_reduction(regF dst, vecD src2, vecD tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5602
  predicate(UseSSE >= 1 && UseAVX == 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5603
  match(Set dst (MulReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5604
  effect(TEMP dst, TEMP tmp);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5605
  format %{ "mulss   $dst,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5606
            "pshufd  $tmp,$src2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5607
            "mulss   $dst,$tmp\t! mul reduction2F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5608
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5609
    __ mulss($dst$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5610
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5611
    __ mulss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5612
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5613
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5614
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5615
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5616
instruct rvmul2F_reduction_reg(regF dst, vecD src2, vecD tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5617
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5618
  match(Set dst (MulReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5619
  effect(TEMP tmp, TEMP dst);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5620
  format %{ "vmulss  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5621
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5622
            "vmulss  $dst,$dst,$tmp\t! mul reduction2F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5623
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5624
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5625
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5626
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5627
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5628
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5629
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5630
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5631
instruct rsmul4F_reduction_reg(regF dst, vecX src2, vecX tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5632
  predicate(UseSSE >= 1 && UseAVX == 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5633
  match(Set dst (MulReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5634
  effect(TEMP dst, TEMP tmp);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5635
  format %{ "mulss   $dst,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5636
            "pshufd  $tmp,$src2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5637
            "mulss   $dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5638
            "pshufd  $tmp,$src2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5639
            "mulss   $dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5640
            "pshufd  $tmp,$src2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5641
            "mulss   $dst,$tmp\t! mul reduction4F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5642
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5643
    __ mulss($dst$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5644
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5645
    __ mulss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5646
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5647
    __ mulss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5648
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5649
    __ mulss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5650
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5651
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5652
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5653
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5654
instruct rvmul4F_reduction_reg(regF dst, vecX src2, vecX tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5655
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5656
  match(Set dst (MulReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5657
  effect(TEMP tmp, TEMP dst);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5658
  format %{ "vmulss  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5659
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5660
            "vmulss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5661
            "pshufd  $tmp,$src2,0x02\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5662
            "vmulss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5663
            "pshufd  $tmp,$src2,0x03\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5664
            "vmulss  $dst,$dst,$tmp\t! mul reduction4F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5665
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5666
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5667
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5668
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5669
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5670
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5671
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5672
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5673
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5674
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5675
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5676
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5677
instruct rvmul8F_reduction_reg(regF dst, vecY src2, vecY tmp, vecY tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5678
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5679
  match(Set dst (MulReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5680
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5681
  format %{ "vmulss  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5682
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5683
            "vmulss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5684
            "pshufd  $tmp,$src2,0x02\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5685
            "vmulss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5686
            "pshufd  $tmp,$src2,0x03\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5687
            "vmulss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5688
            "vextractf128_high  $tmp2,$src2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5689
            "vmulss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5690
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5691
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5692
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5693
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5694
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5695
            "vmulss  $dst,$dst,$tmp\t! mul reduction8F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5696
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5697
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5698
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5699
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5700
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5701
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5702
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5703
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5704
    __ vextractf128_high($tmp2$$XMMRegister, $src2$$XMMRegister);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5705
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5706
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5707
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5708
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5709
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5710
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5711
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5712
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5713
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5714
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5715
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5716
instruct rvmul16F_reduction_reg(regF dst, legVecZ src2, legVecZ tmp, legVecZ tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5717
  predicate(UseAVX > 2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5718
  match(Set dst (MulReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5719
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5720
  format %{ "vmulss  $dst,$dst,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5721
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5722
            "vmulss  $dst,$dst,$tmp\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5723
            "pshufd  $tmp,$src2,0x02\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5724
            "vmulss  $dst,$dst,$tmp\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5725
            "pshufd  $tmp,$src2,0x03\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5726
            "vmulss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5727
            "vextractf32x4  $tmp2,$src2,0x1\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5728
            "vmulss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5729
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5730
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5731
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5732
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5733
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5734
            "vmulss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5735
            "vextractf32x4  $tmp2,$src2,0x2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5736
            "vmulss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5737
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5738
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5739
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5740
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5741
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5742
            "vmulss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5743
            "vextractf32x4  $tmp2,$src2,0x3\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5744
            "vmulss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5745
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5746
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5747
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5748
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5749
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5750
            "vmulss  $dst,$dst,$tmp\t! mul reduction16F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5751
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5752
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5753
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5754
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5755
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5756
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5757
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5758
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5759
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5760
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5761
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5762
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5763
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5764
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5765
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5766
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5767
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5768
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5769
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5770
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5771
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5772
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5773
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5774
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5775
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x3);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5776
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5777
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5778
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5779
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5780
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5781
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5782
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5783
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5784
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5785
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5786
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5787
instruct rsmul2D_reduction_reg(regD dst, vecX src2, vecX tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5788
  predicate(UseSSE >= 1 && UseAVX == 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5789
  match(Set dst (MulReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5790
  effect(TEMP dst, TEMP tmp);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5791
  format %{ "mulsd   $dst,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5792
            "pshufd  $tmp,$src2,0xE\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5793
            "mulsd   $dst,$tmp\t! mul reduction2D" %}
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5794
  ins_encode %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5795
    __ mulsd($dst$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5796
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5797
    __ mulsd($dst$$XMMRegister, $tmp$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5798
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5799
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5800
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5801
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5802
instruct rvmul2D_reduction_reg(regD dst, vecX src2, vecX tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5803
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5804
  match(Set dst (MulReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5805
  effect(TEMP tmp, TEMP dst);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5806
  format %{ "vmulsd  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5807
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5808
            "vmulsd  $dst,$dst,$tmp\t! mul reduction2D" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5809
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5810
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5811
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5812
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5813
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5814
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5815
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5816
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5817
instruct rvmul4D_reduction_reg(regD dst, vecY src2, vecY tmp, vecY tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5818
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5819
  match(Set dst (MulReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5820
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5821
  format %{ "vmulsd  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5822
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5823
            "vmulsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5824
            "vextractf128_high  $tmp2,$src2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5825
            "vmulsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5826
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5827
            "vmulsd  $dst,$dst,$tmp\t! mul reduction4D" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5828
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5829
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5830
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5831
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5832
    __ vextractf128_high($tmp2$$XMMRegister, $src2$$XMMRegister);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5833
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5834
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5835
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5836
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5837
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5838
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5839
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5840
instruct rvmul8D_reduction_reg(regD dst, legVecZ src2, legVecZ tmp, legVecZ tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5841
  predicate(UseAVX > 2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5842
  match(Set dst (MulReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5843
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5844
  format %{ "vmulsd  $dst,$dst,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5845
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5846
            "vmulsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5847
            "vextractf32x4  $tmp2,$src2,0x1\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5848
            "vmulsd  $dst,$dst,$tmp2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5849
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5850
            "vmulsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5851
            "vextractf32x4  $tmp2,$src2,0x2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5852
            "vmulsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5853
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5854
            "vmulsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5855
            "vextractf32x4  $tmp2,$src2,0x3\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5856
            "vmulsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5857
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5858
            "vmulsd  $dst,$dst,$tmp\t! mul reduction8D" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5859
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5860
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5861
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5862
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5863
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5864
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5865
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5866
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5867
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5868
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5869
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5870
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5871
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x3);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5872
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5873
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5874
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5875
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5876
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5877
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5878
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5879
// ====================VECTOR ARITHMETIC=======================================
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5880
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5881
// --------------------------------- ADD --------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5882
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5883
// Bytes vector add
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5884
instruct vadd4B(vecS dst, vecS src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5885
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5886
  match(Set dst (AddVB dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5887
  format %{ "paddb   $dst,$src\t! add packed4B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5888
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5889
    __ paddb($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5890
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5891
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5892
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5893
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5894
instruct vadd4B_reg(vecS dst, vecS src1, vecS src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5895
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5896
  match(Set dst (AddVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5897
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed4B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5898
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5899
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5900
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5901
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5902
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5903
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5904
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5905
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5906
instruct vadd4B_mem(vecS dst, vecS src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5907
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5908
  match(Set dst (AddVB src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5909
  format %{ "vpaddb  $dst,$src,$mem\t! add packed4B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5910
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5911
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5912
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5913
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5914
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5915
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5916
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5917
instruct vadd8B(vecD dst, vecD src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5918
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5919
  match(Set dst (AddVB dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5920
  format %{ "paddb   $dst,$src\t! add packed8B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5921
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5922
    __ paddb($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5923
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5924
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5925
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5926
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5927
instruct vadd8B_reg(vecD dst, vecD src1, vecD src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5928
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5929
  match(Set dst (AddVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5930
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed8B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5931
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5932
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5933
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5934
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5935
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5936
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5937
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5938
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5939
instruct vadd8B_mem(vecD dst, vecD src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5940
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5941
  match(Set dst (AddVB src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5942
  format %{ "vpaddb  $dst,$src,$mem\t! add packed8B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5943
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5944
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5945
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5946
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5947
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5948
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5949
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5950
instruct vadd16B(vecX dst, vecX src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5951
  predicate(UseAVX == 0 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5952
  match(Set dst (AddVB dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5953
  format %{ "paddb   $dst,$src\t! add packed16B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5954
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5955
    __ paddb($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5956
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5957
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5958
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5959
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5960
instruct vadd16B_reg(vecX dst, vecX src1, vecX src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5961
  predicate(UseAVX > 0  && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5962
  match(Set dst (AddVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5963
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed16B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5964
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5965
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5966
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5967
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5968
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5969
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5970
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5971
instruct vadd16B_mem(vecX dst, vecX src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5972
  predicate(UseAVX > 0 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5973
  match(Set dst (AddVB src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5974
  format %{ "vpaddb  $dst,$src,$mem\t! add packed16B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5975
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5976
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5977
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5978
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5979
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5980
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5981
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5982
instruct vadd32B_reg(vecY dst, vecY src1, vecY src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5983
  predicate(UseAVX > 1 && n->as_Vector()->length() == 32);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5984
  match(Set dst (AddVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5985
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed32B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5986
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5987
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5988
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5989
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5990
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5991
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5992
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5993
instruct vadd32B_mem(vecY dst, vecY src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  5994
  predicate(UseAVX > 1 && n->as_Vector()->length() == 32);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5995
  match(Set dst (AddVB src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5996
  format %{ "vpaddb  $dst,$src,$mem\t! add packed32B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5997
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5998
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5999
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6000
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6001
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6002
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6003
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6004
instruct vadd64B_reg(vecZ dst, vecZ src1, vecZ src2) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6005
  predicate(UseAVX > 2 && VM_Version::supports_avx512bw() && n->as_Vector()->length() == 64);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6006
  match(Set dst (AddVB src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6007
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed64B" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6008
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6009
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6010
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6011
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6012
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6013
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6014
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6015
instruct vadd64B_mem(vecZ dst, vecZ src, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6016
  predicate(UseAVX > 2 && VM_Version::supports_avx512bw() && n->as_Vector()->length() == 64);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6017
  match(Set dst (AddVB src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6018
  format %{ "vpaddb  $dst,$src,$mem\t! add packed64B" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6019
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6020
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6021
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6022
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6023
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6024
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6025
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6026
// Shorts/Chars vector add
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6027
instruct vadd2S(vecS dst, vecS src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6028
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6029
  match(Set dst (AddVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6030
  format %{ "paddw   $dst,$src\t! add packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6031
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6032
    __ paddw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6033
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6034
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6035
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6036
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6037
instruct vadd2S_reg(vecS dst, vecS src1, vecS src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6038
  predicate(UseAVX > 0  && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6039
  match(Set dst (AddVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6040
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6041
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6042
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6043
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6044
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6045
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6046
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6047
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6048
instruct vadd2S_mem(vecS dst, vecS src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6049
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6050
  match(Set dst (AddVS src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6051
  format %{ "vpaddw  $dst,$src,$mem\t! add packed2S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6052
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6053
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6054
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6055
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6056
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6057
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6058
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6059
instruct vadd4S(vecD dst, vecD src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6060
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6061
  match(Set dst (AddVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6062
  format %{ "paddw   $dst,$src\t! add packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6063
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6064
    __ paddw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6065
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6066
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6067
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6068
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6069
instruct vadd4S_reg(vecD dst, vecD src1, vecD src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6070
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6071
  match(Set dst (AddVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6072
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6073
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6074
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6075
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6076
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6077
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6078
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6079
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6080
instruct vadd4S_mem(vecD dst, vecD src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6081
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6082
  match(Set dst (AddVS src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6083
  format %{ "vpaddw  $dst,$src,$mem\t! add packed4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6084
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6085
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6086
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6087
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6088
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6089
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6090
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6091
instruct vadd8S(vecX dst, vecX src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6092
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6093
  match(Set dst (AddVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6094
  format %{ "paddw   $dst,$src\t! add packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6095
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6096
    __ paddw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6097
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6098
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6099
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6100
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6101
instruct vadd8S_reg(vecX dst, vecX src1, vecX src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6102
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6103
  match(Set dst (AddVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6104
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6105
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6106
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6107
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6108
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6109
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6110
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6111
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6112
instruct vadd8S_mem(vecX dst, vecX src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6113
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6114
  match(Set dst (AddVS src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6115
  format %{ "vpaddw  $dst,$src,$mem\t! add packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6116
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6117
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6118
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6119
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6120
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6121
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6122
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6123
instruct vadd16S_reg(vecY dst, vecY src1, vecY src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6124
  predicate(UseAVX > 1 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6125
  match(Set dst (AddVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6126
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6127
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6128
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6129
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6130
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6131
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6132
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6133
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6134
instruct vadd16S_mem(vecY dst, vecY src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6135
  predicate(UseAVX > 1 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6136
  match(Set dst (AddVS src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6137
  format %{ "vpaddw  $dst,$src,$mem\t! add packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6138
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6139
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6140
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6141
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6142
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6143
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6144
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6145
instruct vadd32S_reg(vecZ dst, vecZ src1, vecZ src2) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6146
  predicate(UseAVX > 2 && VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6147
  match(Set dst (AddVS src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6148
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6149
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6150
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6151
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6152
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6153
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6154
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6155
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6156
instruct vadd32S_mem(vecZ dst, vecZ src, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6157
  predicate(UseAVX > 2 && VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6158
  match(Set dst (AddVS src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6159
  format %{ "vpaddw  $dst,$src,$mem\t! add packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6160
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6161
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6162
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6163
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6164
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6165
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6166
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6167
// Integers vector add
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6168
instruct vadd2I(vecD dst, vecD src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6169
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6170
  match(Set dst (AddVI dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6171
  format %{ "paddd   $dst,$src\t! add packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6172
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6173
    __ paddd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6174
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6175
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6176
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6177
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6178
instruct vadd2I_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6179
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6180
  match(Set dst (AddVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6181
  format %{ "vpaddd  $dst,$src1,$src2\t! add packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6182
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6183
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6184
    __ vpaddd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6185
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6186
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6187
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6188
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6189
instruct vadd2I_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6190
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6191
  match(Set dst (AddVI src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6192
  format %{ "vpaddd  $dst,$src,$mem\t! add packed2I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6193
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6194
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6195
    __ vpaddd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6196
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6197
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6198
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6199
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6200
instruct vadd4I(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6201
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6202
  match(Set dst (AddVI dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6203
  format %{ "paddd   $dst,$src\t! add packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6204
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6205
    __ paddd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6206
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6207
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6208
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6209
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6210
instruct vadd4I_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6211
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6212
  match(Set dst (AddVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6213
  format %{ "vpaddd  $dst,$src1,$src2\t! add packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6214
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6215
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6216
    __ vpaddd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6217
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6218
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6219
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6220
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6221
instruct vadd4I_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6222
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6223
  match(Set dst (AddVI src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6224
  format %{ "vpaddd  $dst,$src,$mem\t! add packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6225
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6226
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6227
    __ vpaddd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6228
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6229
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6230
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6231
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6232
instruct vadd8I_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6233
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6234
  match(Set dst (AddVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6235
  format %{ "vpaddd  $dst,$src1,$src2\t! add packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6236
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6237
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6238
    __ vpaddd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6239
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6240
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6241
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6242
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6243
instruct vadd8I_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6244
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6245
  match(Set dst (AddVI src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6246
  format %{ "vpaddd  $dst,$src,$mem\t! add packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6247
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6248
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6249
    __ vpaddd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6250
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6251
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6252
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6253
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6254
instruct vadd16I_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6255
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6256
  match(Set dst (AddVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6257
  format %{ "vpaddd  $dst,$src1,$src2\t! add packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6258
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6259
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6260
    __ vpaddd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6261
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6262
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6263
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6264
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6265
instruct vadd16I_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6266
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6267
  match(Set dst (AddVI src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6268
  format %{ "vpaddd  $dst,$src,$mem\t! add packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6269
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6270
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6271
    __ vpaddd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6272
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6273
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6274
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6275
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6276
// Longs vector add
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6277
instruct vadd2L(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6278
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6279
  match(Set dst (AddVL dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6280
  format %{ "paddq   $dst,$src\t! add packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6281
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6282
    __ paddq($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6283
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6284
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6285
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6286
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6287
instruct vadd2L_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6288
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6289
  match(Set dst (AddVL src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6290
  format %{ "vpaddq  $dst,$src1,$src2\t! add packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6291
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6292
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6293
    __ vpaddq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6294
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6295
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6296
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6297
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6298
instruct vadd2L_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6299
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6300
  match(Set dst (AddVL src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6301
  format %{ "vpaddq  $dst,$src,$mem\t! add packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6302
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6303
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6304
    __ vpaddq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6305
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6306
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6307
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6308
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6309
instruct vadd4L_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6310
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6311
  match(Set dst (AddVL src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6312
  format %{ "vpaddq  $dst,$src1,$src2\t! add packed4L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6313
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6314
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6315
    __ vpaddq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6316
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6317
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6318
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6319
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6320
instruct vadd4L_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6321
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6322
  match(Set dst (AddVL src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6323
  format %{ "vpaddq  $dst,$src,$mem\t! add packed4L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6324
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6325
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6326
    __ vpaddq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6327
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6328
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6329
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6330
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6331
instruct vadd8L_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6332
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6333
  match(Set dst (AddVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6334
  format %{ "vpaddq  $dst,$src1,$src2\t! add packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6335
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6336
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6337
    __ vpaddq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6338
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6339
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6340
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6341
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6342
instruct vadd8L_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6343
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6344
  match(Set dst (AddVL src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6345
  format %{ "vpaddq  $dst,$src,$mem\t! add packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6346
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6347
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6348
    __ vpaddq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6349
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6350
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6351
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6352
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6353
// Floats vector add
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6354
instruct vadd2F(vecD dst, vecD src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6355
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6356
  match(Set dst (AddVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6357
  format %{ "addps   $dst,$src\t! add packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6358
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6359
    __ addps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6360
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6361
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6362
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6363
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6364
instruct vadd2F_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6365
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6366
  match(Set dst (AddVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6367
  format %{ "vaddps  $dst,$src1,$src2\t! add packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6368
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6369
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6370
    __ vaddps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6371
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6372
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6373
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6374
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6375
instruct vadd2F_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6376
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6377
  match(Set dst (AddVF src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6378
  format %{ "vaddps  $dst,$src,$mem\t! add packed2F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6379
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6380
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6381
    __ vaddps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6382
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6383
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6384
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6385
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6386
instruct vadd4F(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6387
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6388
  match(Set dst (AddVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6389
  format %{ "addps   $dst,$src\t! add packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6390
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6391
    __ addps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6392
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6393
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6394
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6395
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6396
instruct vadd4F_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6397
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6398
  match(Set dst (AddVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6399
  format %{ "vaddps  $dst,$src1,$src2\t! add packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6400
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6401
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6402
    __ vaddps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6403
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6404
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6405
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6406
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6407
instruct vadd4F_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6408
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6409
  match(Set dst (AddVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6410
  format %{ "vaddps  $dst,$src,$mem\t! add packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6411
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6412
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6413
    __ vaddps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6414
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6415
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6416
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6417
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6418
instruct vadd8F_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6419
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6420
  match(Set dst (AddVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6421
  format %{ "vaddps  $dst,$src1,$src2\t! add packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6422
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6423
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6424
    __ vaddps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6425
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6426
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6427
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6428
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6429
instruct vadd8F_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6430
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6431
  match(Set dst (AddVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6432
  format %{ "vaddps  $dst,$src,$mem\t! add packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6433
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6434
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6435
    __ vaddps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6436
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6437
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6438
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6439
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6440
instruct vadd16F_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6441
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6442
  match(Set dst (AddVF src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6443
  format %{ "vaddps  $dst,$src1,$src2\t! add packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6444
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6445
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6446
    __ vaddps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6447
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6448
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6449
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6450
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6451
instruct vadd16F_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6452
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6453
  match(Set dst (AddVF src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6454
  format %{ "vaddps  $dst,$src,$mem\t! add packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6455
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6456
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6457
    __ vaddps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6458
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6459
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6460
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6461
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6462
// Doubles vector add
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6463
instruct vadd2D(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6464
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6465
  match(Set dst (AddVD dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6466
  format %{ "addpd   $dst,$src\t! add packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6467
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6468
    __ addpd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6469
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6470
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6471
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6472
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6473
instruct vadd2D_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6474
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6475
  match(Set dst (AddVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6476
  format %{ "vaddpd  $dst,$src1,$src2\t! add packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6477
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6478
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6479
    __ vaddpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6480
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6481
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6482
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6483
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6484
instruct vadd2D_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6485
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6486
  match(Set dst (AddVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6487
  format %{ "vaddpd  $dst,$src,$mem\t! add packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6488
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6489
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6490
    __ vaddpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6491
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6492
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6493
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6494
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6495
instruct vadd4D_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6496
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6497
  match(Set dst (AddVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6498
  format %{ "vaddpd  $dst,$src1,$src2\t! add packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6499
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6500
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6501
    __ vaddpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6502
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6503
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6504
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6505
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6506
instruct vadd4D_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6507
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6508
  match(Set dst (AddVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6509
  format %{ "vaddpd  $dst,$src,$mem\t! add packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6510
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6511
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6512
    __ vaddpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6513
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6514
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6515
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6516
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6517
instruct vadd8D_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6518
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6519
  match(Set dst (AddVD src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6520
  format %{ "vaddpd  $dst,$src1,$src2\t! add packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6521
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6522
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6523
    __ vaddpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6524
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6525
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6526
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6527
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6528
instruct vadd8D_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6529
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6530
  match(Set dst (AddVD src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6531
  format %{ "vaddpd  $dst,$src,$mem\t! add packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6532
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6533
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6534
    __ vaddpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6535
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6536
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6537
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6538
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6539
// --------------------------------- SUB --------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6540
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6541
// Bytes vector sub
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6542
instruct vsub4B(vecS dst, vecS src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6543
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6544
  match(Set dst (SubVB dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6545
  format %{ "psubb   $dst,$src\t! sub packed4B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6546
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6547
    __ psubb($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6548
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6549
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6550
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6551
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6552
instruct vsub4B_reg(vecS dst, vecS src1, vecS src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6553
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6554
  match(Set dst (SubVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6555
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed4B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6556
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6557
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6558
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6559
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6560
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6561
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6562
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6563
instruct vsub4B_mem(vecS dst, vecS src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6564
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6565
  match(Set dst (SubVB src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6566
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed4B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6567
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6568
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6569
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6570
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6571
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6572
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6573
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6574
instruct vsub8B(vecD dst, vecD src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6575
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6576
  match(Set dst (SubVB dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6577
  format %{ "psubb   $dst,$src\t! sub packed8B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6578
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6579
    __ psubb($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6580
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6581
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6582
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6583
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6584
instruct vsub8B_reg(vecD dst, vecD src1, vecD src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6585
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6586
  match(Set dst (SubVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6587
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed8B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6588
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6589
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6590
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6591
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6592
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6593
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6594
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6595
instruct vsub8B_mem(vecD dst, vecD src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6596
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6597
  match(Set dst (SubVB src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6598
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed8B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6599
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6600
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6601
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6602
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6603
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6604
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6605
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6606
instruct vsub16B(vecX dst, vecX src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6607
  predicate(UseAVX == 0 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6608
  match(Set dst (SubVB dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6609
  format %{ "psubb   $dst,$src\t! sub packed16B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6610
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6611
    __ psubb($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6612
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6613
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6614
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6615
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6616
instruct vsub16B_reg(vecX dst, vecX src1, vecX src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6617
  predicate(UseAVX > 0 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6618
  match(Set dst (SubVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6619
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed16B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6620
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6621
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6622
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6623
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6624
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6625
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6626
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6627
instruct vsub16B_mem(vecX dst, vecX src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6628
  predicate(UseAVX > 0 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6629
  match(Set dst (SubVB src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6630
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed16B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6631
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6632
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6633
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6634
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6635
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6636
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6637
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6638
instruct vsub32B_reg(vecY dst, vecY src1, vecY src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6639
  predicate(UseAVX > 1 && n->as_Vector()->length() == 32);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6640
  match(Set dst (SubVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6641
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed32B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6642
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6643
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6644
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6645
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6646
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6647
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6648
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6649
instruct vsub32B_mem(vecY dst, vecY src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6650
  predicate(UseAVX > 1 && n->as_Vector()->length() == 32);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6651
  match(Set dst (SubVB src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6652
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed32B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6653
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6654
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6655
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6656
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6657
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6658
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6659
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6660
instruct vsub64B_reg(vecZ dst, vecZ src1, vecZ src2) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6661
  predicate(UseAVX > 2 && VM_Version::supports_avx512bw() && n->as_Vector()->length() == 64);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6662
  match(Set dst (SubVB src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6663
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed64B" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6664
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6665
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6666
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6667
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6668
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6669
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6670
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6671
instruct vsub64B_mem(vecZ dst, vecZ src, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6672
  predicate(UseAVX > 2 && VM_Version::supports_avx512bw() && n->as_Vector()->length() == 64);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6673
  match(Set dst (SubVB src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6674
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed64B" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6675
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6676
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6677
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6678
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6679
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6680
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6681
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6682
// Shorts/Chars vector sub
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6683
instruct vsub2S(vecS dst, vecS src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6684
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6685
  match(Set dst (SubVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6686
  format %{ "psubw   $dst,$src\t! sub packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6687
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6688
    __ psubw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6689
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6690
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6691
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6692
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6693
instruct vsub2S_reg(vecS dst, vecS src1, vecS src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6694
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6695
  match(Set dst (SubVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6696
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6697
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6698
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6699
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6700
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6701
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6702
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6703
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6704
instruct vsub2S_mem(vecS dst, vecS src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6705
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6706
  match(Set dst (SubVS src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6707
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed2S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6708
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6709
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6710
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6711
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6712
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6713
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6714
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6715
instruct vsub4S(vecD dst, vecD src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6716
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6717
  match(Set dst (SubVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6718
  format %{ "psubw   $dst,$src\t! sub packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6719
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6720
    __ psubw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6721
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6722
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6723
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6724
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6725
instruct vsub4S_reg(vecD dst, vecD src1, vecD src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6726
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6727
  match(Set dst (SubVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6728
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6729
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6730
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6731
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6732
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6733
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6734
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6735
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6736
instruct vsub4S_mem(vecD dst, vecD src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6737
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6738
  match(Set dst (SubVS src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6739
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6740
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6741
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6742
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6743
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6744
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6745
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6746
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6747
instruct vsub8S(vecX dst, vecX src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6748
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6749
  match(Set dst (SubVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6750
  format %{ "psubw   $dst,$src\t! sub packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6751
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6752
    __ psubw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6753
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6754
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6755
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6756
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6757
instruct vsub8S_reg(vecX dst, vecX src1, vecX src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6758
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6759
  match(Set dst (SubVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6760
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6761
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6762
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6763
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6764
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6765
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6766
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6767
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6768
instruct vsub8S_mem(vecX dst, vecX src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6769
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6770
  match(Set dst (SubVS src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6771
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6772
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6773
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6774
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6775
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6776
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6777
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6778
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6779
instruct vsub16S_reg(vecY dst, vecY src1, vecY src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6780
  predicate(UseAVX > 1 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6781
  match(Set dst (SubVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6782
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6783
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6784
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6785
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6786
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6787
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6788
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6789
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6790
instruct vsub16S_mem(vecY dst, vecY src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6791
  predicate(UseAVX > 1 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6792
  match(Set dst (SubVS src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6793
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6794
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6795
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6796
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6797
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6798
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6799
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6800
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6801
instruct vsub32S_reg(vecZ dst, vecZ src1, vecZ src2) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6802
  predicate(UseAVX > 2 && VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6803
  match(Set dst (SubVS src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6804
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6805
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6806
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6807
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6808
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6809
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6810
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6811
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6812
instruct vsub32S_mem(vecZ dst, vecZ src, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6813
  predicate(UseAVX > 2 && VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6814
  match(Set dst (SubVS src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6815
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6816
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6817
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6818
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6819
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6820
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6821
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6822
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6823
// Integers vector sub
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6824
instruct vsub2I(vecD dst, vecD src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6825
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6826
  match(Set dst (SubVI dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6827
  format %{ "psubd   $dst,$src\t! sub packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6828
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6829
    __ psubd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6830
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6831
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6832
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6833
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6834
instruct vsub2I_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6835
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6836
  match(Set dst (SubVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6837
  format %{ "vpsubd  $dst,$src1,$src2\t! sub packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6838
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6839
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6840
    __ vpsubd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6841
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6842
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6843
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6844
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6845
instruct vsub2I_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6846
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6847
  match(Set dst (SubVI src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6848
  format %{ "vpsubd  $dst,$src,$mem\t! sub packed2I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6849
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6850
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6851
    __ vpsubd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6852
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6853
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6854
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6855
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6856
instruct vsub4I(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6857
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6858
  match(Set dst (SubVI dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6859
  format %{ "psubd   $dst,$src\t! sub packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6860
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6861
    __ psubd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6862
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6863
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6864
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6865
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6866
instruct vsub4I_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6867
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6868
  match(Set dst (SubVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6869
  format %{ "vpsubd  $dst,$src1,$src2\t! sub packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6870
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6871
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6872
    __ vpsubd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6873
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6874
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6875
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6876
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6877
instruct vsub4I_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6878
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6879
  match(Set dst (SubVI src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6880
  format %{ "vpsubd  $dst,$src,$mem\t! sub packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6881
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6882
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6883
    __ vpsubd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6884
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6885
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6886
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6887
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6888
instruct vsub8I_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6889
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6890
  match(Set dst (SubVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6891
  format %{ "vpsubd  $dst,$src1,$src2\t! sub packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6892
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6893
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6894
    __ vpsubd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6895
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6896
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6897
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6898
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6899
instruct vsub8I_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6900
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6901
  match(Set dst (SubVI src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6902
  format %{ "vpsubd  $dst,$src,$mem\t! sub packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6903
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6904
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6905
    __ vpsubd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6906
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6907
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6908
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6909
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6910
instruct vsub16I_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6911
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6912
  match(Set dst (SubVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6913
  format %{ "vpsubd  $dst,$src1,$src2\t! sub packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6914
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6915
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6916
    __ vpsubd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6917
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6918
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6919
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6920
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6921
instruct vsub16I_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6922
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6923
  match(Set dst (SubVI src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6924
  format %{ "vpsubd  $dst,$src,$mem\t! sub packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6925
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6926
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6927
    __ vpsubd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6928
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6929
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6930
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6931
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6932
// Longs vector sub
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6933
instruct vsub2L(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  6934
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6935
  match(Set dst (SubVL dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6936
  format %{ "psubq   $dst,$src\t! sub packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6937
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6938
    __ psubq($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6939
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6940
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6941
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6942
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6943
instruct vsub2L_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6944
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6945
  match(Set dst (SubVL src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6946
  format %{ "vpsubq  $dst,$src1,$src2\t! sub packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6947
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6948
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6949
    __ vpsubq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6950
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6951
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6952
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6953
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6954
instruct vsub2L_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6955
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6956
  match(Set dst (SubVL src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6957
  format %{ "vpsubq  $dst,$src,$mem\t! sub packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6958
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6959
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6960
    __ vpsubq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6961
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6962
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6963
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6964
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6965
instruct vsub4L_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6966
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6967
  match(Set dst (SubVL src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6968
  format %{ "vpsubq  $dst,$src1,$src2\t! sub packed4L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6969
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6970
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6971
    __ vpsubq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6972
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6973
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6974
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6975
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6976
instruct vsub4L_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6977
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6978
  match(Set dst (SubVL src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6979
  format %{ "vpsubq  $dst,$src,$mem\t! sub packed4L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6980
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6981
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6982
    __ vpsubq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6983
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6984
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6985
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6986
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6987
instruct vsub8L_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6988
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6989
  match(Set dst (SubVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6990
  format %{ "vpsubq  $dst,$src1,$src2\t! sub packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6991
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6992
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6993
    __ vpsubq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6994
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6995
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6996
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6997
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6998
instruct vsub8L_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6999
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7000
  match(Set dst (SubVL src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7001
  format %{ "vpsubq  $dst,$src,$mem\t! sub packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7002
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7003
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7004
    __ vpsubq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7005
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7006
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7007
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7008
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7009
// Floats vector sub
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7010
instruct vsub2F(vecD dst, vecD src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7011
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7012
  match(Set dst (SubVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7013
  format %{ "subps   $dst,$src\t! sub packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7014
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7015
    __ subps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7016
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7017
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7018
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7019
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7020
instruct vsub2F_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7021
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7022
  match(Set dst (SubVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7023
  format %{ "vsubps  $dst,$src1,$src2\t! sub packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7024
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7025
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7026
    __ vsubps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7027
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7028
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7029
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7030
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7031
instruct vsub2F_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7032
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7033
  match(Set dst (SubVF src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7034
  format %{ "vsubps  $dst,$src,$mem\t! sub packed2F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7035
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7036
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7037
    __ vsubps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7038
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7039
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7040
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7041
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7042
instruct vsub4F(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7043
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7044
  match(Set dst (SubVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7045
  format %{ "subps   $dst,$src\t! sub packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7046
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7047
    __ subps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7048
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7049
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7050
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7051
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7052
instruct vsub4F_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7053
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7054
  match(Set dst (SubVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7055
  format %{ "vsubps  $dst,$src1,$src2\t! sub packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7056
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7057
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7058
    __ vsubps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7059
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7060
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7061
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7062
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7063
instruct vsub4F_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7064
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7065
  match(Set dst (SubVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7066
  format %{ "vsubps  $dst,$src,$mem\t! sub packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7067
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7068
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7069
    __ vsubps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7070
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7071
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7072
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7073
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7074
instruct vsub8F_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7075
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7076
  match(Set dst (SubVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7077
  format %{ "vsubps  $dst,$src1,$src2\t! sub packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7078
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7079
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7080
    __ vsubps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7081
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7082
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7083
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7084
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7085
instruct vsub8F_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7086
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7087
  match(Set dst (SubVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7088
  format %{ "vsubps  $dst,$src,$mem\t! sub packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7089
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7090
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7091
    __ vsubps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7092
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7093
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7094
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7095
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7096
instruct vsub16F_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7097
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7098
  match(Set dst (SubVF src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7099
  format %{ "vsubps  $dst,$src1,$src2\t! sub packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7100
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7101
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7102
    __ vsubps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7103
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7104
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7105
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7106
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7107
instruct vsub16F_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7108
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7109
  match(Set dst (SubVF src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7110
  format %{ "vsubps  $dst,$src,$mem\t! sub packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7111
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7112
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7113
    __ vsubps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7114
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7115
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7116
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7117
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7118
// Doubles vector sub
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7119
instruct vsub2D(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7120
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7121
  match(Set dst (SubVD dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7122
  format %{ "subpd   $dst,$src\t! sub packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7123
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7124
    __ subpd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7125
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7126
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7127
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7128
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7129
instruct vsub2D_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7130
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7131
  match(Set dst (SubVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7132
  format %{ "vsubpd  $dst,$src1,$src2\t! sub packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7133
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7134
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7135
    __ vsubpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7136
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7137
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7138
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7139
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7140
instruct vsub2D_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7141
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7142
  match(Set dst (SubVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7143
  format %{ "vsubpd  $dst,$src,$mem\t! sub packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7144
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7145
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7146
    __ vsubpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7147
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7148
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7149
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7150
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7151
instruct vsub4D_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7152
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7153
  match(Set dst (SubVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7154
  format %{ "vsubpd  $dst,$src1,$src2\t! sub packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7155
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7156
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7157
    __ vsubpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7158
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7159
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7160
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7161
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7162
instruct vsub4D_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7163
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7164
  match(Set dst (SubVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7165
  format %{ "vsubpd  $dst,$src,$mem\t! sub packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7166
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7167
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7168
    __ vsubpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7169
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7170
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7171
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7172
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7173
instruct vsub8D_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7174
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7175
  match(Set dst (SubVD src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7176
  format %{ "vsubpd  $dst,$src1,$src2\t! sub packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7177
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7178
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7179
    __ vsubpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7180
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7181
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7182
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7183
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7184
instruct vsub8D_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7185
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7186
  match(Set dst (SubVD src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7187
  format %{ "vsubpd  $dst,$src,$mem\t! sub packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7188
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7189
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7190
    __ vsubpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7191
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7192
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7193
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7194
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7195
// --------------------------------- MUL --------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7196
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7197
// Byte vector mul
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7198
instruct mul4B_reg(vecS dst, vecS src1, vecS src2, vecS tmp, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7199
  predicate(UseSSE > 3 && n->as_Vector()->length() == 4);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7200
  match(Set dst (MulVB src1 src2));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7201
  effect(TEMP dst, TEMP tmp, TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7202
  format %{"pmovsxbw  $tmp,$src1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7203
           "pmovsxbw  $dst,$src2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7204
           "pmullw    $tmp,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7205
           "movdqu    $dst,[0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7206
           "pand      $dst,$tmp\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7207
           "packuswb  $dst,$dst\t! mul packed4B" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7208
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7209
    __ pmovsxbw($tmp$$XMMRegister, $src1$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7210
    __ pmovsxbw($dst$$XMMRegister, $src2$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7211
    __ pmullw($tmp$$XMMRegister, $dst$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7212
    __ movdqu($dst$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7213
    __ pand($dst$$XMMRegister, $tmp$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7214
    __ packuswb($dst$$XMMRegister, $dst$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7215
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7216
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7217
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7218
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7219
instruct mul8B_reg(vecD dst, vecD src1, vecD src2, vecD tmp, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7220
  predicate(UseSSE > 3 && n->as_Vector()->length() == 8);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7221
  match(Set dst (MulVB src1 src2));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7222
  effect(TEMP dst, TEMP tmp, TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7223
  format %{"pmovsxbw  $tmp,$src1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7224
           "pmovsxbw  $dst,$src2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7225
           "pmullw    $tmp,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7226
           "movdqu    $dst,[0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7227
           "pand      $dst,$tmp\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7228
           "packuswb  $dst,$dst\t! mul packed8B" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7229
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7230
    __ pmovsxbw($tmp$$XMMRegister, $src1$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7231
    __ pmovsxbw($dst$$XMMRegister, $src2$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7232
    __ pmullw($tmp$$XMMRegister, $dst$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7233
    __ movdqu($dst$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7234
    __ pand($dst$$XMMRegister, $tmp$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7235
    __ packuswb($dst$$XMMRegister, $dst$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7236
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7237
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7238
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7239
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7240
instruct mul16B_reg(vecX dst, vecX src1, vecX src2, vecX tmp1, vecX tmp2, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7241
  predicate(UseSSE > 3 && n->as_Vector()->length() == 16);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7242
  match(Set dst (MulVB src1 src2));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7243
  effect(TEMP dst, TEMP tmp1, TEMP tmp2, TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7244
  format %{"pmovsxbw  $tmp1,$src1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7245
           "pmovsxbw  $tmp2,$src2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7246
           "pmullw    $tmp1,$tmp2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7247
           "pshufd    $tmp2,$src1,0xEE\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7248
           "pshufd    $dst,$src2,0xEE\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7249
           "pmovsxbw  $tmp2,$tmp2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7250
           "pmovsxbw  $dst,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7251
           "pmullw    $tmp2,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7252
           "movdqu    $dst,[0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7253
           "pand      $tmp2,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7254
           "pand      $dst,$tmp1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7255
           "packuswb  $dst,$tmp2\t! mul packed16B" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7256
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7257
    __ pmovsxbw($tmp1$$XMMRegister, $src1$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7258
    __ pmovsxbw($tmp2$$XMMRegister, $src2$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7259
    __ pmullw($tmp1$$XMMRegister, $tmp2$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7260
    __ pshufd($tmp2$$XMMRegister, $src1$$XMMRegister, 0xEE);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7261
    __ pshufd($dst$$XMMRegister, $src2$$XMMRegister, 0xEE);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7262
    __ pmovsxbw($tmp2$$XMMRegister, $tmp2$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7263
    __ pmovsxbw($dst$$XMMRegister, $dst$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7264
    __ pmullw($tmp2$$XMMRegister, $dst$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7265
    __ movdqu($dst$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7266
    __ pand($tmp2$$XMMRegister, $dst$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7267
    __ pand($dst$$XMMRegister, $tmp1$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7268
    __ packuswb($dst$$XMMRegister, $tmp2$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7269
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7270
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7271
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7272
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7273
instruct vmul16B_reg_avx(vecX dst, vecX src1, vecX src2, vecX tmp, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7274
  predicate(UseAVX > 1 && n->as_Vector()->length() == 16);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7275
  match(Set dst (MulVB src1 src2));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7276
  effect(TEMP dst, TEMP tmp, TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7277
  format %{"vpmovsxbw  $tmp,$src1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7278
           "vpmovsxbw  $dst,$src2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7279
           "vpmullw    $tmp,$tmp,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7280
           "vmovdqu    $dst,[0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7281
           "vpand      $dst,$dst,$tmp\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7282
           "vextracti128_high  $tmp,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7283
           "vpackuswb  $dst,$dst,$dst\n\t! mul packed16B" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7284
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7285
  int vector_len = 1;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7286
    __ vpmovsxbw($tmp$$XMMRegister, $src1$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7287
    __ vpmovsxbw($dst$$XMMRegister, $src2$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7288
    __ vpmullw($tmp$$XMMRegister, $tmp$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7289
    __ vmovdqu($dst$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7290
    __ vpand($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7291
    __ vextracti128_high($tmp$$XMMRegister, $dst$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7292
    __ vpackuswb($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister, 0);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7293
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7294
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7295
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7296
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7297
instruct vmul32B_reg_avx(vecY dst, vecY src1, vecY src2, vecY tmp1, vecY tmp2, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7298
  predicate(UseAVX > 1 && n->as_Vector()->length() == 32);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7299
  match(Set dst (MulVB src1 src2));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7300
  effect(TEMP dst, TEMP tmp1, TEMP tmp2, TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7301
  format %{"vextracti128_high  $tmp1,$src1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7302
           "vextracti128_high  $dst,$src2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7303
           "vpmovsxbw $tmp1,$tmp1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7304
           "vpmovsxbw $dst,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7305
           "vpmullw $tmp1,$tmp1,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7306
           "vpmovsxbw $tmp2,$src1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7307
           "vpmovsxbw $dst,$src2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7308
           "vpmullw $tmp2,$tmp2,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7309
           "vmovdqu $dst, [0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7310
           "vpbroadcastd $dst, $dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7311
           "vpand $tmp1,$tmp1,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7312
           "vpand $dst,$dst,$tmp2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7313
           "vpackuswb $dst,$dst,$tmp1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7314
           "vpermq $dst, $dst, 0xD8\t! mul packed32B" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7315
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7316
    int vector_len = 1;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7317
    __ vextracti128_high($tmp1$$XMMRegister, $src1$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7318
    __ vextracti128_high($dst$$XMMRegister, $src2$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7319
    __ vpmovsxbw($tmp1$$XMMRegister, $tmp1$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7320
    __ vpmovsxbw($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7321
    __ vpmullw($tmp1$$XMMRegister, $tmp1$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7322
    __ vpmovsxbw($tmp2$$XMMRegister, $src1$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7323
    __ vpmovsxbw($dst$$XMMRegister, $src2$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7324
    __ vpmullw($tmp2$$XMMRegister, $tmp2$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7325
    __ vmovdqu($dst$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7326
    __ vpbroadcastd($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7327
    __ vpand($tmp1$$XMMRegister, $tmp1$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7328
    __ vpand($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7329
    __ vpackuswb($dst$$XMMRegister, $dst$$XMMRegister, $tmp1$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7330
    __ vpermq($dst$$XMMRegister, $dst$$XMMRegister, 0xD8, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7331
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7332
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7333
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7334
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7335
instruct vmul64B_reg_avx(vecZ dst, vecZ src1, vecZ src2, vecZ tmp1, vecZ tmp2, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7336
  predicate(UseAVX > 2 && n->as_Vector()->length() == 64);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7337
  match(Set dst (MulVB src1 src2));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7338
  effect(TEMP dst, TEMP tmp1, TEMP tmp2, TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7339
  format %{"vextracti64x4_high  $tmp1,$src1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7340
           "vextracti64x4_high  $dst,$src2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7341
           "vpmovsxbw $tmp1,$tmp1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7342
           "vpmovsxbw $dst,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7343
           "vpmullw $tmp1,$tmp1,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7344
           "vpmovsxbw $tmp2,$src1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7345
           "vpmovsxbw $dst,$src2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7346
           "vpmullw $tmp2,$tmp2,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7347
           "vmovdqu $dst, [0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7348
           "vpbroadcastd $dst, $dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7349
           "vpand $tmp1,$tmp1,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7350
           "vpand $tmp2,$tmp2,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7351
           "vpackuswb $dst,$tmp1,$tmp2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7352
           "evmovdquq  $tmp2,[0x0604020007050301]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7353
           "vpermq $dst,$tmp2,$dst,0x01\t! mul packed64B" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7354
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7355
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7356
    int vector_len = 2;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7357
    __ vextracti64x4_high($tmp1$$XMMRegister, $src1$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7358
    __ vextracti64x4_high($dst$$XMMRegister, $src2$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7359
    __ vpmovsxbw($tmp1$$XMMRegister, $tmp1$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7360
    __ vpmovsxbw($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7361
    __ vpmullw($tmp1$$XMMRegister, $tmp1$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7362
    __ vpmovsxbw($tmp2$$XMMRegister, $src1$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7363
    __ vpmovsxbw($dst$$XMMRegister, $src2$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7364
    __ vpmullw($tmp2$$XMMRegister, $tmp2$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7365
    __ vmovdqu($dst$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7366
    __ vpbroadcastd($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7367
    __ vpand($tmp1$$XMMRegister, $tmp1$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7368
    __ vpand($tmp2$$XMMRegister, $tmp2$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7369
    __ vpackuswb($dst$$XMMRegister, $tmp1$$XMMRegister, $tmp2$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7370
    __ evmovdquq($tmp2$$XMMRegister, ExternalAddress(vector_byte_perm_mask()), vector_len, $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7371
    __ vpermq($dst$$XMMRegister, $tmp2$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7372
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7373
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7374
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7375
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  7376
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7377
// Shorts/Chars vector mul
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7378
instruct vmul2S(vecS dst, vecS src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7379
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7380
  match(Set dst (MulVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7381
  format %{ "pmullw $dst,$src\t! mul packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7382
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7383
    __ pmullw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7384
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7385
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7386
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7387
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7388
instruct vmul2S_reg(vecS dst, vecS src1, vecS src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7389
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7390
  match(Set dst (MulVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7391
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7392
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7393
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7394
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7395
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7396
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7397
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7398
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7399
instruct vmul2S_mem(vecS dst, vecS src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7400
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7401
  match(Set dst (MulVS src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7402
  format %{ "vpmullw $dst,$src,$mem\t! mul packed2S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7403
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7404
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7405
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7406
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7407
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7408
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7409
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7410
instruct vmul4S(vecD dst, vecD src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7411
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7412
  match(Set dst (MulVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7413
  format %{ "pmullw  $dst,$src\t! mul packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7414
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7415
    __ pmullw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7416
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7417
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7418
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7419
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7420
instruct vmul4S_reg(vecD dst, vecD src1, vecD src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7421
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7422
  match(Set dst (MulVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7423
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7424
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7425
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7426
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7427
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7428
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7429
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7430
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7431
instruct vmul4S_mem(vecD dst, vecD src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7432
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7433
  match(Set dst (MulVS src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7434
  format %{ "vpmullw $dst,$src,$mem\t! mul packed4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7435
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7436
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7437
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7438
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7439
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7440
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7441
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7442
instruct vmul8S(vecX dst, vecX src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7443
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7444
  match(Set dst (MulVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7445
  format %{ "pmullw  $dst,$src\t! mul packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7446
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7447
    __ pmullw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7448
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7449
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7450
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7451
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7452
instruct vmul8S_reg(vecX dst, vecX src1, vecX src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7453
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7454
  match(Set dst (MulVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7455
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7456
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7457
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7458
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7459
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7460
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7461
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7462
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7463
instruct vmul8S_mem(vecX dst, vecX src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7464
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7465
  match(Set dst (MulVS src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7466
  format %{ "vpmullw $dst,$src,$mem\t! mul packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7467
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7468
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7469
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7470
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7471
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7472
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7473
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7474
instruct vmul16S_reg(vecY dst, vecY src1, vecY src2) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7475
  predicate(UseAVX > 1 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7476
  match(Set dst (MulVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7477
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7478
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7479
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7480
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7481
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7482
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7483
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7484
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7485
instruct vmul16S_mem(vecY dst, vecY src, memory mem) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7486
  predicate(UseAVX > 1 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7487
  match(Set dst (MulVS src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7488
  format %{ "vpmullw $dst,$src,$mem\t! mul packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7489
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7490
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7491
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7492
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7493
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7494
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7495
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7496
instruct vmul32S_reg(vecZ dst, vecZ src1, vecZ src2) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7497
  predicate(UseAVX > 2 && VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7498
  match(Set dst (MulVS src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7499
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7500
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7501
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7502
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7503
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7504
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7505
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7506
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7507
instruct vmul32S_mem(vecZ dst, vecZ src, memory mem) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7508
  predicate(UseAVX > 2 && VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7509
  match(Set dst (MulVS src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7510
  format %{ "vpmullw $dst,$src,$mem\t! mul packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7511
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7512
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7513
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7514
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7515
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7516
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7517
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7518
// Integers vector mul (sse4_1)
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7519
instruct vmul2I(vecD dst, vecD src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7520
  predicate(UseSSE > 3 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7521
  match(Set dst (MulVI dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7522
  format %{ "pmulld  $dst,$src\t! mul packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7523
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7524
    __ pmulld($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7525
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7526
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7527
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7528
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7529
instruct vmul2I_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7530
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7531
  match(Set dst (MulVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7532
  format %{ "vpmulld $dst,$src1,$src2\t! mul packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7533
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7534
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7535
    __ vpmulld($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7536
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7537
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7538
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7539
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7540
instruct vmul2I_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7541
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7542
  match(Set dst (MulVI src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7543
  format %{ "vpmulld $dst,$src,$mem\t! mul packed2I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7544
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7545
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7546
    __ vpmulld($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7547
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7548
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7549
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7550
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7551
instruct vmul4I(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7552
  predicate(UseSSE > 3 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7553
  match(Set dst (MulVI dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7554
  format %{ "pmulld  $dst,$src\t! mul packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7555
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7556
    __ pmulld($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7557
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7558
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7559
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7560
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7561
instruct vmul4I_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7562
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7563
  match(Set dst (MulVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7564
  format %{ "vpmulld $dst,$src1,$src2\t! mul packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7565
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7566
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7567
    __ vpmulld($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7568
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7569
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7570
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7571
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7572
instruct vmul4I_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7573
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7574
  match(Set dst (MulVI src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7575
  format %{ "vpmulld $dst,$src,$mem\t! mul packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7576
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7577
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7578
    __ vpmulld($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7579
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7580
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7581
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7582
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7583
instruct vmul2L_reg(vecX dst, vecX src1, vecX src2) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7584
  predicate(UseAVX > 2 && n->as_Vector()->length() == 2 && VM_Version::supports_avx512dq());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7585
  match(Set dst (MulVL src1 src2));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7586
  format %{ "vpmullq $dst,$src1,$src2\t! mul packed2L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7587
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7588
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7589
    __ vpmullq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7590
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7591
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7592
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7593
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7594
instruct vmul2L_mem(vecX dst, vecX src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7595
  predicate(UseAVX > 2 && n->as_Vector()->length() == 2 && VM_Version::supports_avx512dq());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7596
  match(Set dst (MulVL src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7597
  format %{ "vpmullq $dst,$src,$mem\t! mul packed2L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7598
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7599
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7600
    __ vpmullq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7601
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7602
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7603
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7604
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7605
instruct vmul4L_reg(vecY dst, vecY src1, vecY src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7606
  predicate(UseAVX > 2 && n->as_Vector()->length() == 4 && VM_Version::supports_avx512dq());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7607
  match(Set dst (MulVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7608
  format %{ "vpmullq $dst,$src1,$src2\t! mul packed4L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7609
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7610
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7611
    __ vpmullq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7612
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7613
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7614
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7615
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7616
instruct vmul4L_mem(vecY dst, vecY src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7617
  predicate(UseAVX > 2 && n->as_Vector()->length() == 4 && VM_Version::supports_avx512dq());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7618
  match(Set dst (MulVL src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7619
  format %{ "vpmullq $dst,$src,$mem\t! mul packed4L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7620
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7621
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7622
    __ vpmullq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7623
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7624
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7625
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7626
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7627
instruct vmul8L_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7628
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8 && VM_Version::supports_avx512dq());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7629
  match(Set dst (MulVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7630
  format %{ "vpmullq $dst,$src1,$src2\t! mul packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7631
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7632
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7633
    __ vpmullq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7634
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7635
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7636
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7637
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7638
instruct vmul8L_mem(vecZ dst, vecZ src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7639
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8 && VM_Version::supports_avx512dq());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7640
  match(Set dst (MulVL src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7641
  format %{ "vpmullq $dst,$src,$mem\t! mul packed8L" %}
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7642
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7643
    int vector_len = 2;
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7644
    __ vpmullq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7645
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7646
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7647
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7648
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7649
instruct vmul8I_reg(vecY dst, vecY src1, vecY src2) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7650
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7651
  match(Set dst (MulVI src1 src2));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7652
  format %{ "vpmulld $dst,$src1,$src2\t! mul packed8I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7653
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7654
    int vector_len = 1;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7655
    __ vpmulld($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7656
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7657
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7658
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7659
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7660
instruct vmul8I_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7661
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7662
  match(Set dst (MulVI src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7663
  format %{ "vpmulld $dst,$src,$mem\t! mul packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7664
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7665
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7666
    __ vpmulld($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7667
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7668
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7669
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7670
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7671
instruct vmul16I_reg(vecZ dst, vecZ src1, vecZ src2) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7672
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7673
  match(Set dst (MulVI src1 src2));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7674
  format %{ "vpmulld $dst,$src1,$src2\t! mul packed16I" %}
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7675
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7676
    int vector_len = 2;
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7677
    __ vpmulld($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7678
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7679
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7680
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7681
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7682
instruct vmul16I_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7683
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7684
  match(Set dst (MulVI src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7685
  format %{ "vpmulld $dst,$src,$mem\t! mul packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7686
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7687
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7688
    __ vpmulld($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7689
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7690
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7691
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7692
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7693
// Floats vector mul
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7694
instruct vmul2F(vecD dst, vecD src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7695
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7696
  match(Set dst (MulVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7697
  format %{ "mulps   $dst,$src\t! mul packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7698
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7699
    __ mulps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7700
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7701
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7702
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7703
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7704
instruct vmul2F_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7705
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7706
  match(Set dst (MulVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7707
  format %{ "vmulps  $dst,$src1,$src2\t! mul packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7708
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7709
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7710
    __ vmulps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7711
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7712
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7713
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7714
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7715
instruct vmul2F_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7716
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7717
  match(Set dst (MulVF src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7718
  format %{ "vmulps  $dst,$src,$mem\t! mul packed2F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7719
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7720
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7721
    __ vmulps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7722
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7723
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7724
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7725
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7726
instruct vmul4F(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7727
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7728
  match(Set dst (MulVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7729
  format %{ "mulps   $dst,$src\t! mul packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7730
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7731
    __ mulps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7732
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7733
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7734
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7735
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7736
instruct vmul4F_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7737
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7738
  match(Set dst (MulVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7739
  format %{ "vmulps  $dst,$src1,$src2\t! mul packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7740
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7741
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7742
    __ vmulps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7743
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7744
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7745
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7746
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7747
instruct vmul4F_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7748
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7749
  match(Set dst (MulVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7750
  format %{ "vmulps  $dst,$src,$mem\t! mul packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7751
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7752
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7753
    __ vmulps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7754
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7755
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7756
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7757
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7758
instruct vmul8F_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7759
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7760
  match(Set dst (MulVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7761
  format %{ "vmulps  $dst,$src1,$src2\t! mul packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7762
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7763
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7764
    __ vmulps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7765
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7766
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7767
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7768
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7769
instruct vmul8F_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7770
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7771
  match(Set dst (MulVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7772
  format %{ "vmulps  $dst,$src,$mem\t! mul packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7773
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7774
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7775
    __ vmulps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7776
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7777
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7778
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7779
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7780
instruct vmul16F_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7781
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7782
  match(Set dst (MulVF src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7783
  format %{ "vmulps  $dst,$src1,$src2\t! mul packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7784
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7785
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7786
    __ vmulps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7787
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7788
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7789
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7790
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7791
instruct vmul16F_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7792
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7793
  match(Set dst (MulVF src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7794
  format %{ "vmulps  $dst,$src,$mem\t! mul packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7795
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7796
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7797
    __ vmulps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7798
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7799
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7800
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7801
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7802
// Doubles vector mul
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7803
instruct vmul2D(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7804
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7805
  match(Set dst (MulVD dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7806
  format %{ "mulpd   $dst,$src\t! mul packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7807
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7808
    __ mulpd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7809
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7810
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7811
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7812
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7813
instruct vmul2D_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7814
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7815
  match(Set dst (MulVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7816
  format %{ "vmulpd  $dst,$src1,$src2\t! mul packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7817
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7818
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7819
    __ vmulpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7820
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7821
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7822
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7823
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7824
instruct vmul2D_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7825
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7826
  match(Set dst (MulVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7827
  format %{ "vmulpd  $dst,$src,$mem\t! mul packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7828
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7829
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7830
    __ vmulpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7831
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7832
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7833
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7834
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7835
instruct vmul4D_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7836
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7837
  match(Set dst (MulVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7838
  format %{ "vmulpd  $dst,$src1,$src2\t! mul packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7839
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7840
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7841
    __ vmulpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7842
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7843
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7844
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7845
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7846
instruct vmul4D_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7847
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7848
  match(Set dst (MulVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7849
  format %{ "vmulpd  $dst,$src,$mem\t! mul packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7850
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7851
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7852
    __ vmulpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7853
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7854
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7855
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7856
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7857
instruct vmul8D_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7858
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7859
  match(Set dst (MulVD src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7860
  format %{ "vmulpd  $dst k0,$src1,$src2\t! mul packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7861
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7862
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7863
    __ vmulpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7864
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7865
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7866
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7867
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7868
instruct vmul8D_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7869
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7870
  match(Set dst (MulVD src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7871
  format %{ "vmulpd  $dst k0,$src,$mem\t! mul packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7872
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7873
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7874
    __ vmulpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7875
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7876
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7877
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7878
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7879
instruct vcmov8F_reg(legVecY dst, legVecY src1, legVecY src2, immI8 cop, cmpOp_vcmppd copnd) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7880
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
48309
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7881
  match(Set dst (CMoveVF (Binary copnd cop) (Binary src1 src2)));
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7882
  effect(TEMP dst, USE src1, USE src2);
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7883
  format %{ "cmpps.$copnd  $dst, $src1, $src2  ! vcmovevf, cond=$cop\n\t"
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7884
            "blendvps $dst,$src1,$src2,$dst ! vcmovevf\n\t"
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7885
         %}
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7886
  ins_encode %{
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7887
    int vector_len = 1;
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7888
    int cond = (Assembler::Condition)($copnd$$cmpcode);
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7889
    __ cmpps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, cond, vector_len);
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7890
    __ blendvps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, $dst$$XMMRegister, vector_len);
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7891
  %}
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7892
  ins_pipe( pipe_slow );
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7893
%}
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  7894
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7895
instruct vcmov4D_reg(legVecY dst, legVecY src1, legVecY src2, immI8 cop, cmpOp_vcmppd copnd) %{
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7896
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
33469
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  7897
  match(Set dst (CMoveVD (Binary copnd cop) (Binary src1 src2)));
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  7898
  effect(TEMP dst, USE src1, USE src2);
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  7899
  format %{ "cmppd.$copnd  $dst, $src1, $src2  ! vcmovevd, cond=$cop\n\t"
42039
db627462f2c9 8165381: Update for x86 SHA512 using AVX2
kvn
parents: 41333
diff changeset
  7900
            "blendvpd $dst,$src1,$src2,$dst ! vcmovevd\n\t"
33469
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  7901
         %}
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  7902
  ins_encode %{
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  7903
    int vector_len = 1;
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  7904
    int cond = (Assembler::Condition)($copnd$$cmpcode);
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  7905
    __ cmppd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, cond, vector_len);
42039
db627462f2c9 8165381: Update for x86 SHA512 using AVX2
kvn
parents: 41333
diff changeset
  7906
    __ blendvpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, $dst$$XMMRegister, vector_len);
33469
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  7907
  %}
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  7908
  ins_pipe( pipe_slow );
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  7909
%}
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  7910
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7911
// --------------------------------- DIV --------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7912
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7913
// Floats vector div
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7914
instruct vdiv2F(vecD dst, vecD src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7915
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7916
  match(Set dst (DivVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7917
  format %{ "divps   $dst,$src\t! div packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7918
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7919
    __ divps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7920
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7921
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7922
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7923
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7924
instruct vdiv2F_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7925
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7926
  match(Set dst (DivVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7927
  format %{ "vdivps  $dst,$src1,$src2\t! div packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7928
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7929
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7930
    __ vdivps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7931
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7932
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7933
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7934
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7935
instruct vdiv2F_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7936
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7937
  match(Set dst (DivVF src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7938
  format %{ "vdivps  $dst,$src,$mem\t! div packed2F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7939
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7940
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7941
    __ vdivps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7942
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7943
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7944
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7945
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7946
instruct vdiv4F(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  7947
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7948
  match(Set dst (DivVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7949
  format %{ "divps   $dst,$src\t! div packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7950
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7951
    __ divps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7952
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7953
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7954
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7955
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7956
instruct vdiv4F_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7957
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7958
  match(Set dst (DivVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7959
  format %{ "vdivps  $dst,$src1,$src2\t! div packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7960
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7961
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7962
    __ vdivps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7963
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7964
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7965
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7966
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7967
instruct vdiv4F_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7968
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7969
  match(Set dst (DivVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7970
  format %{ "vdivps  $dst,$src,$mem\t! div packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7971
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7972
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7973
    __ vdivps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7974
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7975
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7976
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7977
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7978
instruct vdiv8F_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7979
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7980
  match(Set dst (DivVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7981
  format %{ "vdivps  $dst,$src1,$src2\t! div packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7982
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7983
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7984
    __ vdivps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7985
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7986
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7987
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7988
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7989
instruct vdiv8F_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7990
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7991
  match(Set dst (DivVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7992
  format %{ "vdivps  $dst,$src,$mem\t! div packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7993
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7994
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7995
    __ vdivps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7996
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7997
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7998
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7999
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8000
instruct vdiv16F_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8001
  predicate(UseAVX > 0 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8002
  match(Set dst (DivVF src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8003
  format %{ "vdivps  $dst,$src1,$src2\t! div packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8004
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8005
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8006
    __ vdivps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8007
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8008
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8009
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8010
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8011
instruct vdiv16F_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8012
  predicate(UseAVX > 0 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8013
  match(Set dst (DivVF src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8014
  format %{ "vdivps  $dst,$src,$mem\t! div packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8015
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8016
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8017
    __ vdivps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8018
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8019
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8020
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8021
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8022
// Doubles vector div
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8023
instruct vdiv2D(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  8024
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8025
  match(Set dst (DivVD dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8026
  format %{ "divpd   $dst,$src\t! div packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8027
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8028
    __ divpd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8029
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8030
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8031
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8032
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8033
instruct vdiv2D_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8034
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8035
  match(Set dst (DivVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8036
  format %{ "vdivpd  $dst,$src1,$src2\t! div packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8037
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8038
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8039
    __ vdivpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8040
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8041
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8042
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8043
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8044
instruct vdiv2D_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8045
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8046
  match(Set dst (DivVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8047
  format %{ "vdivpd  $dst,$src,$mem\t! div packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8048
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8049
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8050
    __ vdivpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8051
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8052
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8053
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8054
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8055
instruct vdiv4D_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8056
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8057
  match(Set dst (DivVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8058
  format %{ "vdivpd  $dst,$src1,$src2\t! div packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8059
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8060
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8061
    __ vdivpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8062
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8063
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8064
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8065
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8066
instruct vdiv4D_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8067
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8068
  match(Set dst (DivVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8069
  format %{ "vdivpd  $dst,$src,$mem\t! div packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8070
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8071
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8072
    __ vdivpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8073
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8074
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8075
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8076
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8077
instruct vdiv8D_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8078
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8079
  match(Set dst (DivVD src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8080
  format %{ "vdivpd  $dst,$src1,$src2\t! div packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8081
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8082
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8083
    __ vdivpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8084
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8085
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8086
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8087
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8088
instruct vdiv8D_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8089
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8090
  match(Set dst (DivVD src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8091
  format %{ "vdivpd  $dst,$src,$mem\t! div packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8092
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8093
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8094
    __ vdivpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8095
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8096
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8097
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8098
32723
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8099
// --------------------------------- Sqrt --------------------------------------
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8100
48089
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8101
// Floating point vector sqrt
32723
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8102
instruct vsqrt2D_reg(vecX dst, vecX src) %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8103
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8104
  match(Set dst (SqrtVD src));
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8105
  format %{ "vsqrtpd  $dst,$src\t! sqrt packed2D" %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8106
  ins_encode %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8107
    int vector_len = 0;
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8108
    __ vsqrtpd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8109
  %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8110
  ins_pipe( pipe_slow );
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8111
%}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8112
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8113
instruct vsqrt2D_mem(vecX dst, memory mem) %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8114
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8115
  match(Set dst (SqrtVD (LoadVector mem)));
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8116
  format %{ "vsqrtpd  $dst,$mem\t! sqrt packed2D" %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8117
  ins_encode %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8118
    int vector_len = 0;
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8119
    __ vsqrtpd($dst$$XMMRegister, $mem$$Address, vector_len);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8120
  %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8121
  ins_pipe( pipe_slow );
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8122
%}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8123
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8124
instruct vsqrt4D_reg(vecY dst, vecY src) %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8125
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8126
  match(Set dst (SqrtVD src));
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8127
  format %{ "vsqrtpd  $dst,$src\t! sqrt packed4D" %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8128
  ins_encode %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8129
    int vector_len = 1;
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8130
    __ vsqrtpd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8131
  %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8132
  ins_pipe( pipe_slow );
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8133
%}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8134
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8135
instruct vsqrt4D_mem(vecY dst, memory mem) %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8136
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8137
  match(Set dst (SqrtVD (LoadVector mem)));
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8138
  format %{ "vsqrtpd  $dst,$mem\t! sqrt packed4D" %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8139
  ins_encode %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8140
    int vector_len = 1;
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8141
    __ vsqrtpd($dst$$XMMRegister, $mem$$Address, vector_len);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8142
  %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8143
  ins_pipe( pipe_slow );
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8144
%}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8145
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8146
instruct vsqrt8D_reg(vecZ dst, vecZ src) %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8147
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8148
  match(Set dst (SqrtVD src));
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8149
  format %{ "vsqrtpd  $dst,$src\t! sqrt packed8D" %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8150
  ins_encode %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8151
    int vector_len = 2;
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8152
    __ vsqrtpd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8153
  %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8154
  ins_pipe( pipe_slow );
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8155
%}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8156
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8157
instruct vsqrt8D_mem(vecZ dst, memory mem) %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8158
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8159
  match(Set dst (SqrtVD (LoadVector mem)));
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8160
  format %{ "vsqrtpd  $dst,$mem\t! sqrt packed8D" %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8161
  ins_encode %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8162
    int vector_len = 2;
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8163
    __ vsqrtpd($dst$$XMMRegister, $mem$$Address, vector_len);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8164
  %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8165
  ins_pipe( pipe_slow );
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8166
%}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8167
48089
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8168
instruct vsqrt2F_reg(vecD dst, vecD src) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8169
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8170
  match(Set dst (SqrtVF src));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8171
  format %{ "vsqrtps  $dst,$src\t! sqrt packed2F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8172
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8173
    int vector_len = 0;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8174
    __ vsqrtps($dst$$XMMRegister, $src$$XMMRegister, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8175
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8176
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8177
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8178
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8179
instruct vsqrt2F_mem(vecD dst, memory mem) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8180
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8181
  match(Set dst (SqrtVF (LoadVector mem)));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8182
  format %{ "vsqrtps  $dst,$mem\t! sqrt packed2F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8183
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8184
    int vector_len = 0;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8185
    __ vsqrtps($dst$$XMMRegister, $mem$$Address, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8186
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8187
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8188
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8189
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8190
instruct vsqrt4F_reg(vecX dst, vecX src) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8191
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8192
  match(Set dst (SqrtVF src));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8193
  format %{ "vsqrtps  $dst,$src\t! sqrt packed4F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8194
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8195
    int vector_len = 0;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8196
    __ vsqrtps($dst$$XMMRegister, $src$$XMMRegister, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8197
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8198
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8199
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8200
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8201
instruct vsqrt4F_mem(vecX dst, memory mem) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8202
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8203
  match(Set dst (SqrtVF (LoadVector mem)));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8204
  format %{ "vsqrtps  $dst,$mem\t! sqrt packed4F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8205
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8206
    int vector_len = 0;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8207
    __ vsqrtps($dst$$XMMRegister, $mem$$Address, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8208
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8209
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8210
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8211
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8212
instruct vsqrt8F_reg(vecY dst, vecY src) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8213
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8214
  match(Set dst (SqrtVF src));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8215
  format %{ "vsqrtps  $dst,$src\t! sqrt packed8F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8216
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8217
    int vector_len = 1;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8218
    __ vsqrtps($dst$$XMMRegister, $src$$XMMRegister, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8219
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8220
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8221
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8222
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8223
instruct vsqrt8F_mem(vecY dst, memory mem) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8224
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8225
  match(Set dst (SqrtVF (LoadVector mem)));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8226
  format %{ "vsqrtps  $dst,$mem\t! sqrt packed8F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8227
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8228
    int vector_len = 1;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8229
    __ vsqrtps($dst$$XMMRegister, $mem$$Address, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8230
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8231
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8232
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8233
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8234
instruct vsqrt16F_reg(vecZ dst, vecZ src) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8235
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8236
  match(Set dst (SqrtVF src));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8237
  format %{ "vsqrtps  $dst,$src\t! sqrt packed16F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8238
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8239
    int vector_len = 2;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8240
    __ vsqrtps($dst$$XMMRegister, $src$$XMMRegister, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8241
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8242
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8243
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8244
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8245
instruct vsqrt16F_mem(vecZ dst, memory mem) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8246
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8247
  match(Set dst (SqrtVF (LoadVector mem)));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8248
  format %{ "vsqrtps  $dst,$mem\t! sqrt packed16F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8249
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8250
    int vector_len = 2;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8251
    __ vsqrtps($dst$$XMMRegister, $mem$$Address, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8252
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8253
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8254
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8255
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8256
// ------------------------------ Shift ---------------------------------------
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8257
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8258
// Left and right shift count vectors are the same on x86
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8259
// (only lowest bits of xmm reg are used for count).
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8260
instruct vshiftcnt(vecS dst, rRegI cnt) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8261
  match(Set dst (LShiftCntV cnt));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8262
  match(Set dst (RShiftCntV cnt));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8263
  format %{ "movdl    $dst,$cnt\t! load shift count" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8264
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8265
    __ movdl($dst$$XMMRegister, $cnt$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8266
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8267
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8268
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8269
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8270
instruct vshiftcntimm(vecS dst, immI8 cnt, rRegI tmp) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8271
  match(Set dst cnt);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8272
  effect(TEMP tmp);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8273
  format %{ "movl    $tmp,$cnt\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8274
            "movdl   $dst,$tmp\t! load shift count" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8275
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8276
    __ movl($tmp$$Register, $cnt$$constant);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8277
    __ movdl($dst$$XMMRegister, $tmp$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8278
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8279
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8280
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8281
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8282
// Byte vector shift
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8283
instruct vshift4B(vecS dst, vecS src, vecS shift, vecS tmp, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8284
  predicate(UseSSE > 3 && n->as_Vector()->length() == 4);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8285
  match(Set dst (LShiftVB src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8286
  match(Set dst (RShiftVB src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8287
  match(Set dst (URShiftVB src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8288
  effect(TEMP dst, USE src, USE shift, TEMP tmp, TEMP scratch);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8289
  format %{"vextendbw $tmp,$src\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8290
           "vshiftw   $tmp,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8291
           "movdqu    $dst,[0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8292
           "pand      $dst,$tmp\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8293
           "packuswb  $dst,$dst\n\t ! packed4B shift" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8294
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8295
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8296
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8297
    __ vextendbw(opcode, $tmp$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8298
    __ vshiftw(opcode, $tmp$$XMMRegister, $shift$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8299
    __ movdqu($dst$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), $scratch$$Register); 
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8300
    __ pand($dst$$XMMRegister, $tmp$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8301
    __ packuswb($dst$$XMMRegister, $dst$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8302
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8303
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8304
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8305
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8306
instruct vshift8B(vecD dst, vecD src, vecS shift, vecD tmp, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8307
  predicate(UseSSE > 3 && n->as_Vector()->length() == 8);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8308
  match(Set dst (LShiftVB src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8309
  match(Set dst (RShiftVB src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8310
  match(Set dst (URShiftVB src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8311
  effect(TEMP dst, USE src, USE shift, TEMP tmp, TEMP scratch);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8312
  format %{"vextendbw $tmp,$src\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8313
           "vshiftw   $tmp,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8314
           "movdqu    $dst,[0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8315
           "pand      $dst,$tmp\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8316
           "packuswb  $dst,$dst\n\t ! packed8B shift" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8317
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8318
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8319
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8320
    __ vextendbw(opcode, $tmp$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8321
    __ vshiftw(opcode, $tmp$$XMMRegister, $shift$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8322
    __ movdqu($dst$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), $scratch$$Register); 
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8323
    __ pand($dst$$XMMRegister, $tmp$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8324
    __ packuswb($dst$$XMMRegister, $dst$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8325
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8326
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8327
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8328
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8329
instruct vshift16B(vecX dst, vecX src, vecS shift, vecX tmp1, vecX tmp2, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8330
  predicate(UseSSE > 3  && UseAVX <= 1 && n->as_Vector()->length() == 16);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8331
  match(Set dst (LShiftVB src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8332
  match(Set dst (RShiftVB src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8333
  match(Set dst (URShiftVB src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8334
  effect(TEMP dst, USE src, USE shift, TEMP tmp1, TEMP tmp2, TEMP scratch);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8335
  format %{"vextendbw $tmp1,$src\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8336
           "vshiftw   $tmp1,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8337
           "pshufd    $tmp2,$src\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8338
           "vextendbw $tmp2,$tmp2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8339
           "vshiftw   $tmp2,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8340
           "movdqu    $dst,[0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8341
           "pand      $tmp2,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8342
           "pand      $dst,$tmp1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8343
           "packuswb  $dst,$tmp2\n\t! packed16B shift" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8344
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8345
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8346
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8347
    __ vextendbw(opcode, $tmp1$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8348
    __ vshiftw(opcode, $tmp1$$XMMRegister, $shift$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8349
    __ pshufd($tmp2$$XMMRegister, $src$$XMMRegister, 0xE);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8350
    __ vextendbw(opcode, $tmp2$$XMMRegister, $tmp2$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8351
    __ vshiftw(opcode, $tmp2$$XMMRegister, $shift$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8352
    __ movdqu($dst$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8353
    __ pand($tmp2$$XMMRegister, $dst$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8354
    __ pand($dst$$XMMRegister, $tmp1$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8355
    __ packuswb($dst$$XMMRegister, $tmp2$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8356
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8357
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8358
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8359
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8360
instruct vshift16B_avx(vecX dst, vecX src, vecS shift, vecX tmp, rRegI scratch) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  8361
  predicate(UseAVX > 1 && n->as_Vector()->length() == 16);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8362
  match(Set dst (LShiftVB src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8363
  match(Set dst (RShiftVB src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8364
  match(Set dst (URShiftVB src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8365
  effect(TEMP dst, USE src, USE shift, TEMP tmp, TEMP scratch);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8366
  format %{"vextendbw  $tmp,$src\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8367
           "vshiftw    $tmp,$tmp,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8368
           "vpand      $tmp,$tmp,[0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8369
           "vextracti128_high  $dst,$tmp\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8370
           "vpackuswb  $dst,$tmp,$dst\n\t! packed16B shift" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8371
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8372
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8373
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8374
    int vector_len = 1;
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8375
    __ vextendbw(opcode, $tmp$$XMMRegister, $src$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8376
    __ vshiftw(opcode, $tmp$$XMMRegister, $tmp$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8377
    __ vpand($tmp$$XMMRegister, $tmp$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), vector_len, $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8378
    __ vextracti128_high($dst$$XMMRegister, $tmp$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8379
    __ vpackuswb($dst$$XMMRegister, $tmp$$XMMRegister, $dst$$XMMRegister, 0);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8380
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8381
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8382
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8383
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8384
instruct vshift32B_avx(vecY dst, vecY src, vecS shift, vecY tmp, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8385
  predicate(UseAVX > 1 && n->as_Vector()->length() == 32);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8386
  match(Set dst (LShiftVB src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8387
  match(Set dst (RShiftVB src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8388
  match(Set dst (URShiftVB src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8389
  effect(TEMP dst, USE src, USE shift, TEMP tmp, TEMP scratch);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8390
  format %{"vextracti128_high  $tmp,$src\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8391
           "vextendbw  $tmp,$tmp\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8392
           "vextendbw  $dst,$src\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8393
           "vshiftw    $tmp,$tmp,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8394
           "vshiftw    $dst,$dst,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8395
           "vpand      $tmp,$tmp,[0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8396
           "vpand      $dst,$dst,[0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8397
           "vpackuswb  $dst,$dst,$tmp\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8398
           "vpermq     $dst,$dst,0xD8\n\t! packed32B shift" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8399
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8400
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8401
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8402
    int vector_len = 1;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8403
    __ vextracti128_high($tmp$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8404
    __ vextendbw(opcode, $tmp$$XMMRegister, $tmp$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8405
    __ vextendbw(opcode, $dst$$XMMRegister, $src$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8406
    __ vshiftw(opcode, $tmp$$XMMRegister, $tmp$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8407
    __ vshiftw(opcode, $dst$$XMMRegister, $dst$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8408
    __ vpand($tmp$$XMMRegister, $tmp$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), vector_len, $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8409
    __ vpand($dst$$XMMRegister, $dst$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), vector_len, $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8410
    __ vpackuswb($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8411
    __ vpermq($dst$$XMMRegister, $dst$$XMMRegister, 0xD8, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8412
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8413
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8414
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8415
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8416
instruct vshift64B_avx(vecZ dst, vecZ src, vecS shift, vecZ tmp1, vecZ tmp2, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8417
  predicate(UseAVX > 2 && n->as_Vector()->length() == 64);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8418
  match(Set dst (LShiftVB src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8419
  match(Set dst (RShiftVB src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8420
  match(Set dst (URShiftVB src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8421
  effect(TEMP dst, USE src, USE shift, TEMP tmp1, TEMP tmp2, TEMP scratch);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8422
  format %{"vextracti64x4  $tmp1,$src\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8423
           "vextendbw      $tmp1,$tmp1\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8424
           "vextendbw      $tmp2,$src\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8425
           "vshiftw        $tmp1,$tmp1,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8426
           "vshiftw        $tmp2,$tmp2,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8427
           "vmovdqu        $dst,[0x00ff00ff0x00ff00ff]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8428
           "vpbroadcastd   $dst,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8429
           "vpand          $tmp1,$tmp1,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8430
           "vpand          $tmp2,$tmp2,$dst\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8431
           "vpackuswb      $dst,$tmp1,$tmp2\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8432
           "evmovdquq      $tmp2, [0x0604020007050301]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8433
           "vpermq         $dst,$tmp2,$dst\n\t! packed64B shift" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8434
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8435
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8436
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8437
    int vector_len = 2;
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8438
    __ vextracti64x4($tmp1$$XMMRegister, $src$$XMMRegister, 1);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8439
    __ vextendbw(opcode, $tmp1$$XMMRegister, $tmp1$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8440
    __ vextendbw(opcode, $tmp2$$XMMRegister, $src$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8441
    __ vshiftw(opcode, $tmp1$$XMMRegister, $tmp1$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8442
    __ vshiftw(opcode, $tmp2$$XMMRegister, $tmp2$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8443
    __ vmovdqu($dst$$XMMRegister, ExternalAddress(vector_short_to_byte_mask()), $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8444
    __ vpbroadcastd($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8445
    __ vpand($tmp1$$XMMRegister, $tmp1$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8446
    __ vpand($tmp2$$XMMRegister, $tmp2$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8447
    __ vpackuswb($dst$$XMMRegister, $tmp1$$XMMRegister, $tmp2$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8448
    __ evmovdquq($tmp2$$XMMRegister, ExternalAddress(vector_byte_perm_mask()), vector_len, $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8449
    __ vpermq($dst$$XMMRegister, $tmp2$$XMMRegister, $dst$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8450
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8451
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8452
%}
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8453
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  8454
// Shorts vector logical right shift produces incorrect Java result
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8455
// for negative data because java code convert short value into int with
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  8456
// sign extension before a shift. But char vectors are fine since chars are
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  8457
// unsigned values.
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8458
// Shorts/Chars vector left shift
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8459
instruct vshist2S(vecS dst, vecS src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8460
  predicate(n->as_Vector()->length() == 2);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8461
  match(Set dst (LShiftVS src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8462
  match(Set dst (RShiftVS src shift));
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  8463
  match(Set dst (URShiftVS src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8464
  effect(TEMP dst, USE src, USE shift);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8465
  format %{ "vshiftw  $dst,$src,$shift\t! shift packed2S" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8466
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8467
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8468
    if (UseAVX == 0) { 
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8469
      if ($dst$$XMMRegister != $src$$XMMRegister)
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8470
         __ movflt($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8471
      __ vshiftw(opcode, $dst$$XMMRegister, $shift$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8472
    } else {
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8473
      int vector_len = 0;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8474
      __ vshiftw(opcode, $dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8475
    }
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8476
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8477
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8478
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8479
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8480
instruct vshift4S(vecD dst, vecD src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8481
  predicate(n->as_Vector()->length() == 4);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8482
  match(Set dst (LShiftVS src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8483
  match(Set dst (RShiftVS src shift));
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  8484
  match(Set dst (URShiftVS src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8485
  effect(TEMP dst, USE src, USE shift);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8486
  format %{ "vshiftw  $dst,$src,$shift\t! shift packed4S" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8487
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8488
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8489
    if (UseAVX == 0) { 
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8490
      if ($dst$$XMMRegister != $src$$XMMRegister)
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8491
         __ movdbl($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8492
      __ vshiftw(opcode, $dst$$XMMRegister, $shift$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8493
    
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8494
    } else {
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8495
      int vector_len = 0;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8496
      __ vshiftw(opcode, $dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8497
    }
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8498
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8499
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8500
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8501
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8502
instruct vshift8S(vecX dst, vecX src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8503
  predicate(n->as_Vector()->length() == 8);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8504
  match(Set dst (LShiftVS src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8505
  match(Set dst (RShiftVS src shift));
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  8506
  match(Set dst (URShiftVS src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8507
  effect(TEMP dst, USE src, USE shift);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8508
  format %{ "vshiftw  $dst,$src,$shift\t! shift packed8S" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8509
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8510
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8511
    if (UseAVX == 0) { 
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8512
      if ($dst$$XMMRegister != $src$$XMMRegister)
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8513
         __ movdqu($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8514
      __ vshiftw(opcode, $dst$$XMMRegister, $shift$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8515
    } else {
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8516
      int vector_len = 0;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8517
      __ vshiftw(opcode, $dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8518
    }
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8519
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8520
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8521
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8522
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8523
instruct vshift16S(vecY dst, vecY src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8524
  predicate(UseAVX > 1 && n->as_Vector()->length() == 16);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8525
  match(Set dst (LShiftVS src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8526
  match(Set dst (RShiftVS src shift));
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  8527
  match(Set dst (URShiftVS src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8528
  effect(DEF dst, USE src, USE shift);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8529
  format %{ "vshiftw  $dst,$src,$shift\t! shift packed16S" %}
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  8530
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8531
    int vector_len = 1;
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8532
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8533
    __ vshiftw(opcode, $dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8534
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8535
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8536
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8537
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8538
instruct vshift32S(vecZ dst, vecZ src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8539
  predicate(UseAVX > 2 && VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8540
  match(Set dst (LShiftVS src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8541
  match(Set dst (RShiftVS src shift));
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  8542
  match(Set dst (URShiftVS src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8543
  effect(DEF dst, USE src, USE shift);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8544
  format %{ "vshiftw  $dst,$src,$shift\t! shift packed32S" %}
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8545
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8546
    int vector_len = 2;
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8547
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8548
    __ vshiftw(opcode, $dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8549
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8550
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8551
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8552
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8553
// Integers vector left shift
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8554
instruct vshift2I(vecD dst, vecD src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8555
  predicate(n->as_Vector()->length() == 2);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8556
  match(Set dst (LShiftVI src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8557
  match(Set dst (RShiftVI src shift));
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8558
  match(Set dst (URShiftVI src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8559
  effect(TEMP dst, USE src, USE shift);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8560
  format %{ "vshiftd  $dst,$src,$shift\t! shift packed2I" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8561
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8562
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8563
    if (UseAVX == 0) { 
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8564
      if ($dst$$XMMRegister != $src$$XMMRegister)
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8565
         __ movdbl($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8566
      __ vshiftd(opcode, $dst$$XMMRegister, $shift$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8567
    } else {
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8568
      int vector_len = 0;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8569
      __ vshiftd(opcode, $dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8570
    }
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8571
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8572
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8573
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8574
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8575
instruct vshift4I(vecX dst, vecX src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8576
  predicate(n->as_Vector()->length() == 4);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8577
  match(Set dst (LShiftVI src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8578
  match(Set dst (RShiftVI src shift));
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8579
  match(Set dst (URShiftVI src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8580
  effect(TEMP dst, USE src, USE shift);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8581
  format %{ "vshiftd  $dst,$src,$shift\t! shift packed4I" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8582
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8583
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8584
    if (UseAVX == 0) { 
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8585
      if ($dst$$XMMRegister != $src$$XMMRegister)
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8586
         __ movdqu($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8587
      __ vshiftd(opcode, $dst$$XMMRegister, $shift$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8588
    } else {
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8589
      int vector_len = 0;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8590
      __ vshiftd(opcode, $dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8591
    }
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8592
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8593
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8594
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8595
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8596
instruct vshift8I(vecY dst, vecY src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8597
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8598
  match(Set dst (LShiftVI src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8599
  match(Set dst (RShiftVI src shift));
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8600
  match(Set dst (URShiftVI src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8601
  effect(DEF dst, USE src, USE shift);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8602
  format %{ "vshiftd  $dst,$src,$shift\t! shift packed8I" %}
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8603
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8604
    int vector_len = 1;
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8605
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8606
    __ vshiftd(opcode, $dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8607
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8608
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8609
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8610
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8611
instruct vshift16I(vecZ dst, vecZ src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8612
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8613
  match(Set dst (LShiftVI src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8614
  match(Set dst (RShiftVI src shift));
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8615
  match(Set dst (URShiftVI src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8616
  effect(DEF dst, USE src, USE shift);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8617
  format %{ "vshiftd  $dst,$src,$shift\t! shift packed16I" %}
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8618
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8619
    int vector_len = 2;
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8620
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8621
    __ vshiftd(opcode, $dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8622
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8623
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8624
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8625
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8626
// Longs vector shift
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8627
instruct vshift2L(vecX dst, vecX src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8628
  predicate(n->as_Vector()->length() == 2);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8629
  match(Set dst (LShiftVL src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8630
  match(Set dst (URShiftVL src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8631
  effect(TEMP dst, USE src, USE shift);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8632
  format %{ "vshiftq  $dst,$src,$shift\t! shift packed2L" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8633
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8634
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8635
    if (UseAVX == 0) { 
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8636
      if ($dst$$XMMRegister != $src$$XMMRegister)
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8637
         __ movdqu($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8638
      __ vshiftq(opcode, $dst$$XMMRegister, $shift$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8639
    } else {
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8640
      int vector_len = 0;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8641
      __ vshiftq(opcode, $dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8642
    }
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8643
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8644
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8645
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8646
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8647
instruct vshift4L(vecY dst, vecY src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8648
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8649
  match(Set dst (LShiftVL src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8650
  match(Set dst (URShiftVL src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8651
  effect(DEF dst, USE src, USE shift);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8652
  format %{ "vshiftq  $dst,$src,$shift\t! left shift packed4L" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8653
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8654
    int vector_len = 1;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8655
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8656
    __ vshiftq(opcode, $dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8657
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8658
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8659
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8660
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8661
instruct vshift8L(vecZ dst, vecZ src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8662
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8663
  match(Set dst (LShiftVL src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8664
  match(Set dst (RShiftVL src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8665
  match(Set dst (URShiftVL src shift));
55299
40320fb1920a 8224234: compiler/codegen/TestCharVect2.java fails in test_mulc
sviswanathan
parents: 55061
diff changeset
  8666
  effect(DEF dst, USE src, USE shift);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8667
  format %{ "vshiftq  $dst,$src,$shift\t! shift packed8L" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8668
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8669
    int vector_len = 2;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8670
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8671
    __ vshiftq(opcode, $dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8672
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8673
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8674
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8675
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8676
// -------------------ArithmeticRightShift -----------------------------------
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8677
// Long vector arithmetic right shift
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8678
instruct vsra2L_reg(vecX dst, vecX src, vecS shift, vecX tmp, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8679
  predicate(UseSSE >= 2 && n->as_Vector()->length() == 2);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8680
  match(Set dst (RShiftVL src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8681
  effect(TEMP dst, TEMP tmp, TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8682
  format %{ "movdqu  $dst,$src\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8683
            "psrlq   $dst,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8684
            "movdqu  $tmp,[0x8000000000000000]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8685
            "psrlq   $tmp,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8686
            "pxor    $dst,$tmp\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8687
            "psubq   $dst,$tmp\t! arithmetic right shift packed2L" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8688
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8689
    __ movdqu($dst$$XMMRegister, $src$$XMMRegister);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8690
    __ psrlq($dst$$XMMRegister, $shift$$XMMRegister);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8691
    __ movdqu($tmp$$XMMRegister, ExternalAddress(vector_long_sign_mask()), $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8692
    __ psrlq($tmp$$XMMRegister, $shift$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8693
    __ pxor($dst$$XMMRegister, $tmp$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8694
    __ psubq($dst$$XMMRegister, $tmp$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8695
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8696
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8697
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8698
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8699
instruct vsra2L_reg_evex(vecX dst, vecX src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8700
  predicate(UseAVX > 2 && n->as_Vector()->length() == 2);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8701
  match(Set dst (RShiftVL src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8702
  format %{ "evpsraq  $dst,$src,$shift\t! arithmetic right shift packed2L" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8703
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8704
    int vector_len = 0;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8705
    __ evpsraq($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8706
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8707
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8708
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8709
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8710
instruct vsra4L_reg(vecY dst, vecY src, vecS shift, vecY tmp, rRegI scratch) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8711
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8712
  match(Set dst (RShiftVL src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8713
  effect(TEMP dst, TEMP tmp, TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8714
  format %{ "vpsrlq   $dst,$src,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8715
            "vmovdqu  $tmp,[0x8000000000000000]\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8716
            "vpsrlq   $tmp,$tmp,$shift\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8717
            "vpxor    $dst,$dst,$tmp\n\t"
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8718
            "vpsubq   $dst,$dst,$tmp\t! arithmetic right shift packed4L" %}
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8719
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8720
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8721
    __ vpsrlq($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8722
    __ vmovdqu($tmp$$XMMRegister, ExternalAddress(vector_long_sign_mask()), $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8723
    __ vpsrlq($tmp$$XMMRegister, $tmp$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8724
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8725
    __ vpsubq($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8726
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8727
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8728
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8729
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8730
instruct vsra4L_reg_evex(vecY dst, vecY src, vecS shift) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8731
  predicate(UseAVX > 2 && n->as_Vector()->length() == 4);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8732
  match(Set dst (RShiftVL src shift));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8733
  format %{ "evpsraq  $dst,$src,$shift\t! arithmetic right shift packed4L" %}
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8734
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8735
    int vector_len = 1;
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8736
    __ evpsraq($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8737
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8738
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  8739
%}
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8740
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8741
// --------------------------------- AND --------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8742
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8743
instruct vand4B(vecS dst, vecS src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  8744
  predicate(UseAVX == 0 && n->as_Vector()->length_in_bytes() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8745
  match(Set dst (AndV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8746
  format %{ "pand    $dst,$src\t! and vectors (4 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8747
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8748
    __ pand($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8749
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8750
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8751
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8752
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8753
instruct vand4B_reg(vecS dst, vecS src1, vecS src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8754
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8755
  match(Set dst (AndV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8756
  format %{ "vpand   $dst,$src1,$src2\t! and vectors (4 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8757
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8758
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8759
    __ vpand($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8760
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8761
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8762
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8763
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8764
instruct vand4B_mem(vecS dst, vecS src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8765
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8766
  match(Set dst (AndV src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8767
  format %{ "vpand   $dst,$src,$mem\t! and vectors (4 bytes)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8768
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8769
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8770
    __ vpand($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8771
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8772
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8773
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8774
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8775
instruct vand8B(vecD dst, vecD src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  8776
  predicate(UseAVX == 0 && n->as_Vector()->length_in_bytes() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8777
  match(Set dst (AndV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8778
  format %{ "pand    $dst,$src\t! and vectors (8 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8779
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8780
    __ pand($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8781
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8782
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8783
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8784
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8785
instruct vand8B_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8786
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8787
  match(Set dst (AndV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8788
  format %{ "vpand   $dst,$src1,$src2\t! and vectors (8 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8789
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8790
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8791
    __ vpand($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8792
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8793
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8794
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8795
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8796
instruct vand8B_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8797
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 8);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8798
  match(Set dst (AndV src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8799
  format %{ "vpand   $dst,$src,$mem\t! and vectors (8 bytes)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8800
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8801
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8802
    __ vpand($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8803
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8804
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8805
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8806
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8807
instruct vand16B(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  8808
  predicate(UseAVX == 0 && n->as_Vector()->length_in_bytes() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8809
  match(Set dst (AndV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8810
  format %{ "pand    $dst,$src\t! and vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8811
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8812
    __ pand($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8813
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8814
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8815
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8816
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8817
instruct vand16B_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8818
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8819
  match(Set dst (AndV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8820
  format %{ "vpand   $dst,$src1,$src2\t! and vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8821
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8822
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8823
    __ vpand($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8824
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8825
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8826
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8827
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8828
instruct vand16B_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8829
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8830
  match(Set dst (AndV src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8831
  format %{ "vpand   $dst,$src,$mem\t! and vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8832
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8833
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8834
    __ vpand($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8835
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8836
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8837
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8838
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8839
instruct vand32B_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8840
  predicate(UseAVX > 1 && n->as_Vector()->length_in_bytes() == 32);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8841
  match(Set dst (AndV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8842
  format %{ "vpand   $dst,$src1,$src2\t! and vectors (32 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8843
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8844
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8845
    __ vpand($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8846
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8847
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8848
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8849
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8850
instruct vand32B_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8851
  predicate(UseAVX > 1 && n->as_Vector()->length_in_bytes() == 32);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8852
  match(Set dst (AndV src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8853
  format %{ "vpand   $dst,$src,$mem\t! and vectors (32 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8854
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8855
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8856
    __ vpand($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8857
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8858
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8859
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8860
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8861
instruct vand64B_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8862
  predicate(UseAVX > 2 && n->as_Vector()->length_in_bytes() == 64);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8863
  match(Set dst (AndV src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8864
  format %{ "vpand   $dst,$src1,$src2\t! and vectors (64 bytes)" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8865
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8866
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8867
    __ vpand($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8868
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8869
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8870
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8871
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8872
instruct vand64B_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8873
  predicate(UseAVX > 2 && n->as_Vector()->length_in_bytes() == 64);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8874
  match(Set dst (AndV src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8875
  format %{ "vpand   $dst,$src,$mem\t! and vectors (64 bytes)" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8876
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8877
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8878
    __ vpand($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8879
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8880
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8881
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8882
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8883
// --------------------------------- OR ---------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8884
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8885
instruct vor4B(vecS dst, vecS src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  8886
  predicate(UseAVX == 0 && n->as_Vector()->length_in_bytes() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8887
  match(Set dst (OrV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8888
  format %{ "por     $dst,$src\t! or vectors (4 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8889
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8890
    __ por($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8891
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8892
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8893
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8894
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8895
instruct vor4B_reg(vecS dst, vecS src1, vecS src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8896
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8897
  match(Set dst (OrV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8898
  format %{ "vpor    $dst,$src1,$src2\t! or vectors (4 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8899
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8900
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8901
    __ vpor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8902
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8903
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8904
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8905
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8906
instruct vor4B_mem(vecS dst, vecS src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8907
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8908
  match(Set dst (OrV src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8909
  format %{ "vpor    $dst,$src,$mem\t! or vectors (4 bytes)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8910
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8911
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8912
    __ vpor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8913
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8914
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8915
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8916
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8917
instruct vor8B(vecD dst, vecD src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  8918
  predicate(UseAVX == 0 && n->as_Vector()->length_in_bytes() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8919
  match(Set dst (OrV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8920
  format %{ "por     $dst,$src\t! or vectors (8 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8921
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8922
    __ por($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8923
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8924
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8925
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8926
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8927
instruct vor8B_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8928
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8929
  match(Set dst (OrV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8930
  format %{ "vpor    $dst,$src1,$src2\t! or vectors (8 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8931
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8932
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8933
    __ vpor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8934
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8935
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8936
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8937
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8938
instruct vor8B_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8939
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8940
  match(Set dst (OrV src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8941
  format %{ "vpor    $dst,$src,$mem\t! or vectors (8 bytes)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8942
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8943
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8944
    __ vpor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8945
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8946
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8947
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8948
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8949
instruct vor16B(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  8950
  predicate(UseAVX == 0 && n->as_Vector()->length_in_bytes() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8951
  match(Set dst (OrV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8952
  format %{ "por     $dst,$src\t! or vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8953
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8954
    __ por($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8955
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8956
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8957
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8958
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8959
instruct vor16B_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8960
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8961
  match(Set dst (OrV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8962
  format %{ "vpor    $dst,$src1,$src2\t! or vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8963
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8964
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8965
    __ vpor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8966
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8967
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8968
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8969
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8970
instruct vor16B_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8971
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8972
  match(Set dst (OrV src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8973
  format %{ "vpor    $dst,$src,$mem\t! or vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8974
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8975
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8976
    __ vpor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8977
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8978
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8979
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8980
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8981
instruct vor32B_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8982
  predicate(UseAVX > 1 && n->as_Vector()->length_in_bytes() == 32);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8983
  match(Set dst (OrV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8984
  format %{ "vpor    $dst,$src1,$src2\t! or vectors (32 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8985
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8986
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8987
    __ vpor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8988
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8989
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8990
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8991
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8992
instruct vor32B_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8993
  predicate(UseAVX > 1 && n->as_Vector()->length_in_bytes() == 32);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8994
  match(Set dst (OrV src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8995
  format %{ "vpor    $dst,$src,$mem\t! or vectors (32 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8996
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8997
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8998
    __ vpor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8999
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9000
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9001
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9002
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9003
instruct vor64B_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9004
  predicate(UseAVX > 2 && n->as_Vector()->length_in_bytes() == 64);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9005
  match(Set dst (OrV src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9006
  format %{ "vpor    $dst,$src1,$src2\t! or vectors (64 bytes)" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9007
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9008
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9009
    __ vpor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9010
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9011
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9012
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9013
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9014
instruct vor64B_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9015
  predicate(UseAVX > 2 && n->as_Vector()->length_in_bytes() == 64);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9016
  match(Set dst (OrV src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9017
  format %{ "vpor    $dst,$src,$mem\t! or vectors (64 bytes)" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9018
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9019
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9020
    __ vpor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9021
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9022
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9023
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9024
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9025
// --------------------------------- XOR --------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9026
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9027
instruct vxor4B(vecS dst, vecS src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  9028
  predicate(UseAVX == 0 && n->as_Vector()->length_in_bytes() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9029
  match(Set dst (XorV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9030
  format %{ "pxor    $dst,$src\t! xor vectors (4 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9031
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9032
    __ pxor($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9033
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9034
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9035
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9036
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9037
instruct vxor4B_reg(vecS dst, vecS src1, vecS src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9038
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9039
  match(Set dst (XorV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9040
  format %{ "vpxor   $dst,$src1,$src2\t! xor vectors (4 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9041
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9042
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9043
    __ vpxor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9044
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9045
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9046
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9047
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9048
instruct vxor4B_mem(vecS dst, vecS src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9049
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9050
  match(Set dst (XorV src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9051
  format %{ "vpxor   $dst,$src,$mem\t! xor vectors (4 bytes)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9052
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9053
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9054
    __ vpxor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9055
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9056
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9057
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9058
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9059
instruct vxor8B(vecD dst, vecD src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  9060
  predicate(UseAVX == 0 && n->as_Vector()->length_in_bytes() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9061
  match(Set dst (XorV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9062
  format %{ "pxor    $dst,$src\t! xor vectors (8 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9063
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9064
    __ pxor($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9065
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9066
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9067
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9068
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9069
instruct vxor8B_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9070
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9071
  match(Set dst (XorV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9072
  format %{ "vpxor   $dst,$src1,$src2\t! xor vectors (8 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9073
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9074
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9075
    __ vpxor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9076
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9077
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9078
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9079
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9080
instruct vxor8B_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9081
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 8);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9082
  match(Set dst (XorV src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9083
  format %{ "vpxor   $dst,$src,$mem\t! xor vectors (8 bytes)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9084
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9085
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9086
    __ vpxor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9087
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9088
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9089
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  9090
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9091
instruct vxor16B(vecX dst, vecX src) %{
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 51633
diff changeset
  9092
  predicate(UseAVX == 0 && n->as_Vector()->length_in_bytes() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9093
  match(Set dst (XorV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9094
  format %{ "pxor    $dst,$src\t! xor vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9095
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9096
    __ pxor($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9097
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9098
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9099
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9100
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9101
instruct vxor16B_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9102
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9103
  match(Set dst (XorV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9104
  format %{ "vpxor   $dst,$src1,$src2\t! xor vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9105
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9106
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9107
    __ vpxor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9108
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9109
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9110
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9111
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9112
instruct vxor16B_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9113
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9114
  match(Set dst (XorV src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9115
  format %{ "vpxor   $dst,$src,$mem\t! xor vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9116
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9117
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9118
    __ vpxor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9119
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9120
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9121
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9122
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9123
instruct vxor32B_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9124
  predicate(UseAVX > 1 && n->as_Vector()->length_in_bytes() == 32);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9125
  match(Set dst (XorV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9126
  format %{ "vpxor   $dst,$src1,$src2\t! xor vectors (32 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9127
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9128
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9129
    __ vpxor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9130
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9131
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9132
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9133
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9134
instruct vxor32B_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9135
  predicate(UseAVX > 1 && n->as_Vector()->length_in_bytes() == 32);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9136
  match(Set dst (XorV src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9137
  format %{ "vpxor   $dst,$src,$mem\t! xor vectors (32 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9138
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9139
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9140
    __ vpxor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9141
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9142
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9143
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9144
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9145
instruct vxor64B_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9146
  predicate(UseAVX > 2 && n->as_Vector()->length_in_bytes() == 64);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9147
  match(Set dst (XorV src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9148
  format %{ "vpxor   $dst,$src1,$src2\t! xor vectors (64 bytes)" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9149
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9150
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9151
    __ vpxor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9152
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9153
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9154
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9155
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9156
instruct vxor64B_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9157
  predicate(UseAVX > 2 && n->as_Vector()->length_in_bytes() == 64);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9158
  match(Set dst (XorV src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9159
  format %{ "vpxor   $dst,$src,$mem\t! xor vectors (64 bytes)" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9160
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9161
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9162
    __ vpxor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9163
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9164
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9165
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9166
54750
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9167
// --------------------------------- ABS --------------------------------------
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9168
// a = |a|
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9169
instruct vabs4B_reg(vecS dst, vecS src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9170
  predicate(UseSSE > 2 && n->as_Vector()->length() == 4);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9171
  match(Set dst (AbsVB  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9172
  format %{ "pabsb $dst,$src\t# $dst = |$src| abs packed4B" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9173
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9174
    __ pabsb($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9175
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9176
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9177
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9178
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9179
instruct vabs8B_reg(vecD dst, vecD src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9180
  predicate(UseSSE > 2 && n->as_Vector()->length() == 8);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9181
  match(Set dst (AbsVB  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9182
  format %{ "pabsb $dst,$src\t# $dst = |$src| abs packed8B" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9183
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9184
    __ pabsb($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9185
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9186
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9187
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9188
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9189
instruct vabs16B_reg(vecX dst, vecX src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9190
  predicate(UseSSE > 2 && n->as_Vector()->length() == 16);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9191
  match(Set dst (AbsVB  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9192
  format %{ "pabsb $dst,$src\t# $dst = |$src| abs packed16B" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9193
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9194
    __ pabsb($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9195
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9196
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9197
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9198
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9199
instruct vabs32B_reg(vecY dst, vecY src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9200
  predicate(UseAVX > 1 && n->as_Vector()->length() == 32);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9201
  match(Set dst (AbsVB  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9202
  format %{ "vpabsb $dst,$src\t# $dst = |$src| abs packed32B" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9203
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9204
    int vector_len = 1;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9205
    __ vpabsb($dst$$XMMRegister, $src$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9206
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9207
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9208
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9209
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9210
instruct vabs64B_reg(vecZ dst, vecZ src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9211
  predicate(UseAVX > 2 && n->as_Vector()->length() == 64);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9212
  match(Set dst (AbsVB  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9213
  format %{ "vpabsb $dst,$src\t# $dst = |$src| abs packed64B" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9214
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9215
    int vector_len = 2;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9216
    __ vpabsb($dst$$XMMRegister, $src$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9217
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9218
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9219
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9220
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9221
instruct vabs2S_reg(vecD dst, vecD src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9222
  predicate(UseSSE > 2 && n->as_Vector()->length() == 2);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9223
  match(Set dst (AbsVS  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9224
  format %{ "pabsw $dst,$src\t# $dst = |$src| abs packed2S" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9225
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9226
    __ pabsw($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9227
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9228
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9229
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9230
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9231
instruct vabs4S_reg(vecD dst, vecD src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9232
  predicate(UseSSE > 2 && n->as_Vector()->length() == 4);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9233
  match(Set dst (AbsVS  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9234
  format %{ "pabsw $dst,$src\t# $dst = |$src| abs packed4S" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9235
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9236
    __ pabsw($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9237
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9238
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9239
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9240
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9241
instruct vabs8S_reg(vecX dst, vecX src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9242
  predicate(UseSSE > 2 && n->as_Vector()->length() == 8);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9243
  match(Set dst (AbsVS  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9244
  format %{ "pabsw $dst,$src\t# $dst = |$src| abs packed8S" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9245
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9246
    __ pabsw($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9247
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9248
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9249
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9250
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9251
instruct vabs16S_reg(vecY dst, vecY src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9252
  predicate(UseAVX > 1 && n->as_Vector()->length() == 16);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9253
  match(Set dst (AbsVS  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9254
  format %{ "vpabsw $dst,$src\t# $dst = |$src| abs packed16S" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9255
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9256
    int vector_len = 1;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9257
    __ vpabsw($dst$$XMMRegister, $src$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9258
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9259
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9260
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9261
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9262
instruct vabs32S_reg(vecZ dst, vecZ src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9263
  predicate(UseAVX > 2 && n->as_Vector()->length() == 32);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9264
  match(Set dst (AbsVS  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9265
  format %{ "vpabsw $dst,$src\t# $dst = |$src| abs packed32S" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9266
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9267
    int vector_len = 2;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9268
    __ vpabsw($dst$$XMMRegister, $src$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9269
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9270
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9271
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9272
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9273
instruct vabs2I_reg(vecD dst, vecD src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9274
  predicate(UseSSE > 2 && n->as_Vector()->length() == 2);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9275
  match(Set dst (AbsVI  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9276
  format %{ "pabsd $dst,$src\t# $dst = |$src| abs packed2I" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9277
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9278
    __ pabsd($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9279
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9280
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9281
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9282
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9283
instruct vabs4I_reg(vecX dst, vecX src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9284
  predicate(UseSSE > 2 && n->as_Vector()->length() == 4);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9285
  match(Set dst (AbsVI  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9286
  format %{ "pabsd $dst,$src\t# $dst = |$src| abs packed4I" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9287
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9288
    __ pabsd($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9289
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9290
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9291
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9292
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9293
instruct vabs8I_reg(vecY dst, vecY src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9294
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9295
  match(Set dst (AbsVI src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9296
  format %{ "vpabsd $dst,$src\t# $dst = |$src| abs packed8I" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9297
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9298
    int vector_len = 1;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9299
    __ vpabsd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9300
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9301
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9302
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9303
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9304
instruct vabs16I_reg(vecZ dst, vecZ src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9305
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9306
  match(Set dst (AbsVI src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9307
  format %{ "vpabsd $dst,$src\t# $dst = |$src| abs packed16I" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9308
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9309
    int vector_len = 2;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9310
    __ vpabsd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9311
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9312
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9313
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9314
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9315
instruct vabs2L_reg(vecX dst, vecX src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9316
  predicate(UseAVX > 2 && n->as_Vector()->length() == 2);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9317
  match(Set dst (AbsVL  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9318
  format %{ "evpabsq $dst,$src\t# $dst = |$src| abs packed2L" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9319
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9320
    int vector_len = 0;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9321
    __ evpabsq($dst$$XMMRegister, $src$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9322
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9323
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9324
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9325
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9326
instruct vabs4L_reg(vecY dst, vecY src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9327
  predicate(UseAVX > 2 && n->as_Vector()->length() == 4);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9328
  match(Set dst (AbsVL  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9329
  format %{ "evpabsq $dst,$src\t# $dst = |$src| abs packed4L" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9330
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9331
    int vector_len = 1;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9332
    __ evpabsq($dst$$XMMRegister, $src$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9333
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9334
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9335
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9336
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9337
instruct vabs8L_reg(vecZ dst, vecZ src) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9338
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9339
  match(Set dst (AbsVL  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9340
  format %{ "evpabsq $dst,$src\t# $dst = |$src| abs packed8L" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9341
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9342
    int vector_len = 2;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9343
    __ evpabsq($dst$$XMMRegister, $src$$XMMRegister, vector_len);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9344
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9345
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9346
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9347
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9348
// --------------------------------- ABSNEG --------------------------------------
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9349
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9350
instruct vabsneg2D(vecX dst, vecX src, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9351
  predicate(UseSSE >= 2 && n->as_Vector()->length() == 2);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9352
  match(Set dst (AbsVD  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9353
  match(Set dst (NegVD  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9354
  effect(TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9355
  format %{ "vabsnegd $dst,$src,[mask]\t# absneg packed2D" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9356
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9357
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9358
    if ($dst$$XMMRegister != $src$$XMMRegister)
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9359
      __ movdqu($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9360
    __ vabsnegd(opcode, $dst$$XMMRegister, $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9361
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9362
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9363
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9364
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9365
instruct vabsneg4D(vecY dst, vecY src, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9366
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9367
  match(Set dst (AbsVD  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9368
  match(Set dst (NegVD  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9369
  effect(TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9370
  format %{ "vabsnegd $dst,$src,[mask]\t# absneg packed4D" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9371
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9372
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9373
    int vector_len = 1;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9374
    __ vabsnegd(opcode, $dst$$XMMRegister, $src$$XMMRegister, vector_len, $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9375
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9376
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9377
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9378
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9379
instruct vabsneg8D(vecZ dst, vecZ src, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9380
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9381
  match(Set dst (AbsVD  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9382
  match(Set dst (NegVD  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9383
  effect(TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9384
  format %{ "vabsnegd $dst,$src,[mask]\t# absneg packed8D" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9385
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9386
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9387
    int vector_len = 2;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9388
    __ vabsnegd(opcode, $dst$$XMMRegister, $src$$XMMRegister, vector_len, $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9389
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9390
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9391
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9392
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9393
instruct vabsneg2F(vecD dst, vecD src, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9394
  predicate(UseSSE > 0 && n->as_Vector()->length() == 2);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9395
  match(Set dst (AbsVF  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9396
  match(Set dst (NegVF  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9397
  effect(TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9398
  format %{ "vabsnegf $dst,$src,[mask]\t# absneg packed2F" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9399
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9400
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9401
    if ($dst$$XMMRegister != $src$$XMMRegister)
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9402
      __ movdqu($dst$$XMMRegister, $src$$XMMRegister);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9403
    __ vabsnegf(opcode, $dst$$XMMRegister, $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9404
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9405
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9406
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9407
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9408
instruct vabsneg4F(vecX dst, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9409
  predicate(UseSSE > 0 && n->as_Vector()->length() == 4);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9410
  match(Set dst (AbsVF  dst));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9411
  match(Set dst (NegVF  dst));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9412
  effect(TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9413
  format %{ "vabsnegf $dst,[mask]\t# absneg packed4F" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9414
  ins_cost(150);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9415
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9416
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9417
    __ vabsnegf(opcode, $dst$$XMMRegister, $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9418
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9419
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9420
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9421
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9422
instruct vabsneg8F(vecY dst, vecY src, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9423
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9424
  match(Set dst (AbsVF  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9425
  match(Set dst (NegVF  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9426
  effect(TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9427
  format %{ "vabsnegf $dst,$src,[mask]\t# absneg packed8F" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9428
  ins_cost(150);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9429
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9430
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9431
    int vector_len = 1;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9432
    __ vabsnegf(opcode, $dst$$XMMRegister, $src$$XMMRegister, vector_len, $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9433
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9434
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9435
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9436
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9437
instruct vabsneg16F(vecZ dst, vecZ src, rRegI scratch) %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9438
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9439
  match(Set dst (AbsVF  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9440
  match(Set dst (NegVF  src));
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9441
  effect(TEMP scratch);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9442
  format %{ "vabsnegf $dst,$src,[mask]\t# absneg packed16F" %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9443
  ins_cost(150);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9444
  ins_encode %{
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9445
    int opcode = this->as_Mach()->ideal_Opcode();
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9446
    int vector_len = 2;
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9447
    __ vabsnegf(opcode, $dst$$XMMRegister, $src$$XMMRegister, vector_len, $scratch$$Register);
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9448
  %}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9449
  ins_pipe( pipe_slow );
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9450
%}
1851a532ddfe 8222074: Enhance auto vectorization for x86
sviswanathan
parents: 54022
diff changeset
  9451
46528
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9452
// --------------------------------- FMA --------------------------------------
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9453
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9454
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9455
instruct vfma2D_reg(vecX a, vecX b, vecX c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9456
  predicate(UseFMA && n->as_Vector()->length() == 2);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9457
  match(Set c (FmaVD  c (Binary a b)));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9458
  format %{ "fmapd $a,$b,$c\t# $c = $a * $b + $c fma packed2D" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9459
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9460
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9461
    int vector_len = 0;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9462
    __ vfmad($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9463
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9464
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9465
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9466
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9467
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9468
instruct vfma2D_mem(vecX a, memory b, vecX c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9469
  predicate(UseFMA && n->as_Vector()->length() == 2);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9470
  match(Set c (FmaVD  c (Binary a (LoadVector b))));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9471
  format %{ "fmapd $a,$b,$c\t# $c = $a * $b + $c fma packed2D" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9472
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9473
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9474
    int vector_len = 0;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9475
    __ vfmad($c$$XMMRegister, $a$$XMMRegister, $b$$Address, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9476
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9477
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9478
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9479
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9480
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9481
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9482
instruct vfma4D_reg(vecY a, vecY b, vecY c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9483
  predicate(UseFMA && n->as_Vector()->length() == 4);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9484
  match(Set c (FmaVD  c (Binary a b)));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9485
  format %{ "fmapd $a,$b,$c\t# $c = $a * $b + $c fma packed4D" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9486
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9487
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9488
    int vector_len = 1;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9489
    __ vfmad($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9490
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9491
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9492
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9493
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9494
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9495
instruct vfma4D_mem(vecY a, memory b, vecY c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9496
  predicate(UseFMA && n->as_Vector()->length() == 4);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9497
  match(Set c (FmaVD  c (Binary a (LoadVector b))));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9498
  format %{ "fmapd $a,$b,$c\t# $c = $a * $b + $c fma packed4D" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9499
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9500
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9501
    int vector_len = 1;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9502
    __ vfmad($c$$XMMRegister, $a$$XMMRegister, $b$$Address, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9503
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9504
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9505
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9506
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9507
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9508
instruct vfma8D_reg(vecZ a, vecZ b, vecZ c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9509
  predicate(UseFMA && n->as_Vector()->length() == 8);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9510
  match(Set c (FmaVD  c (Binary a b)));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9511
  format %{ "fmapd $a,$b,$c\t# $c = $a * $b + $c fma packed8D" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9512
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9513
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9514
    int vector_len = 2;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9515
    __ vfmad($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9516
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9517
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9518
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9519
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9520
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9521
instruct vfma8D_mem(vecZ a, memory b, vecZ c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9522
  predicate(UseFMA && n->as_Vector()->length() == 8);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9523
  match(Set c (FmaVD  c (Binary a (LoadVector b))));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9524
  format %{ "fmapd $a,$b,$c\t# $c = $a * $b + $c fma packed8D" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9525
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9526
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9527
    int vector_len = 2;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9528
    __ vfmad($c$$XMMRegister, $a$$XMMRegister, $b$$Address, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9529
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9530
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9531
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9532
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9533
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9534
instruct vfma4F_reg(vecX a, vecX b, vecX c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9535
  predicate(UseFMA && n->as_Vector()->length() == 4);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9536
  match(Set c (FmaVF  c (Binary a b)));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9537
  format %{ "fmaps $a,$b,$c\t# $c = $a * $b + $c fma packed4F" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9538
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9539
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9540
    int vector_len = 0;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9541
    __ vfmaf($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9542
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9543
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9544
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9545
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9546
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9547
instruct vfma4F_mem(vecX a, memory b, vecX c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9548
  predicate(UseFMA && n->as_Vector()->length() == 4);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9549
  match(Set c (FmaVF  c (Binary a (LoadVector b))));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9550
  format %{ "fmaps $a,$b,$c\t# $c = $a * $b + $c fma packed4F" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9551
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9552
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9553
    int vector_len = 0;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9554
    __ vfmaf($c$$XMMRegister, $a$$XMMRegister, $b$$Address, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9555
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9556
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9557
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9558
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9559
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9560
instruct vfma8F_reg(vecY a, vecY b, vecY c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9561
  predicate(UseFMA && n->as_Vector()->length() == 8);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9562
  match(Set c (FmaVF  c (Binary a b)));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9563
  format %{ "fmaps $a,$b,$c\t# $c = $a * $b + $c fma packed8F" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9564
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9565
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9566
    int vector_len = 1;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9567
    __ vfmaf($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9568
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9569
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9570
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9571
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9572
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9573
instruct vfma8F_mem(vecY a, memory b, vecY c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9574
  predicate(UseFMA && n->as_Vector()->length() == 8);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9575
  match(Set c (FmaVF  c (Binary a (LoadVector b))));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9576
  format %{ "fmaps $a,$b,$c\t# $c = $a * $b + $c fma packed8F" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9577
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9578
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9579
    int vector_len = 1;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9580
    __ vfmaf($c$$XMMRegister, $a$$XMMRegister, $b$$Address, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9581
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9582
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9583
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9584
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9585
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9586
instruct vfma16F_reg(vecZ a, vecZ b, vecZ c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9587
  predicate(UseFMA && n->as_Vector()->length() == 16);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9588
  match(Set c (FmaVF  c (Binary a b)));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9589
  format %{ "fmaps $a,$b,$c\t# $c = $a * $b + $c fma packed16F" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9590
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9591
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9592
    int vector_len = 2;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9593
    __ vfmaf($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9594
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9595
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9596
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9597
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9598
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9599
instruct vfma16F_mem(vecZ a, memory b, vecZ c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9600
  predicate(UseFMA && n->as_Vector()->length() == 16);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9601
  match(Set c (FmaVF  c (Binary a (LoadVector b))));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9602
  format %{ "fmaps $a,$b,$c\t# $c = $a * $b + $c fma packed16F" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9603
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9604
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9605
    int vector_len = 2;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9606
    __ vfmaf($c$$XMMRegister, $a$$XMMRegister, $b$$Address, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9607
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9608
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
  9609
%}
49384
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9610
52992
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9611
// --------------------------------- Vector Multiply Add --------------------------------------
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9612
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9613
instruct smuladd4S2I_reg(vecD dst, vecD src1) %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9614
  predicate(UseSSE >= 2 && UseAVX == 0 && n->as_Vector()->length() == 2);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9615
  match(Set dst (MulAddVS2VI dst src1));
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9616
  format %{ "pmaddwd $dst,$dst,$src1\t! muladd packed4Sto2I" %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9617
  ins_encode %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9618
    __ pmaddwd($dst$$XMMRegister, $src1$$XMMRegister);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9619
  %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9620
  ins_pipe( pipe_slow );
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9621
%}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9622
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9623
instruct vmuladd4S2I_reg(vecD dst, vecD src1, vecD src2) %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9624
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9625
  match(Set dst (MulAddVS2VI src1 src2));
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9626
  format %{ "vpmaddwd $dst,$src1,$src2\t! muladd packed4Sto2I" %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9627
  ins_encode %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9628
    int vector_len = 0;
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9629
    __ vpmaddwd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9630
  %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9631
  ins_pipe( pipe_slow );
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9632
%}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9633
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9634
instruct smuladd8S4I_reg(vecX dst, vecX src1) %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9635
  predicate(UseSSE >= 2 && UseAVX == 0 && n->as_Vector()->length() == 4);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9636
  match(Set dst (MulAddVS2VI dst src1));
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9637
  format %{ "pmaddwd $dst,$dst,$src1\t! muladd packed8Sto4I" %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9638
  ins_encode %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9639
    __ pmaddwd($dst$$XMMRegister, $src1$$XMMRegister);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9640
  %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9641
  ins_pipe( pipe_slow );
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9642
%}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9643
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9644
instruct vmuladd8S4I_reg(vecX dst, vecX src1, vecX src2) %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9645
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9646
  match(Set dst (MulAddVS2VI src1 src2));
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9647
  format %{ "vpmaddwd $dst,$src1,$src2\t! muladd packed8Sto4I" %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9648
  ins_encode %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9649
    int vector_len = 0;
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9650
    __ vpmaddwd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9651
  %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9652
  ins_pipe( pipe_slow );
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9653
%}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9654
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9655
instruct vmuladd16S8I_reg(vecY dst, vecY src1, vecY src2) %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9656
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9657
  match(Set dst (MulAddVS2VI src1 src2));
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9658
  format %{ "vpmaddwd $dst,$src1,$src2\t! muladd packed16Sto8I" %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9659
  ins_encode %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9660
    int vector_len = 1;
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9661
    __ vpmaddwd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9662
  %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9663
  ins_pipe( pipe_slow );
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9664
%}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9665
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9666
instruct vmuladd32S16I_reg(vecZ dst, vecZ src1, vecZ src2) %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9667
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9668
  match(Set dst (MulAddVS2VI src1 src2));
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9669
  format %{ "vpmaddwd $dst,$src1,$src2\t! muladd packed32Sto16I" %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9670
  ins_encode %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9671
    int vector_len = 2;
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9672
    __ vpmaddwd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9673
  %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9674
  ins_pipe( pipe_slow );
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9675
%}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9676
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9677
// --------------------------------- Vector Multiply Add Add ----------------------------------
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9678
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9679
instruct vmuladdadd4S2I_reg(vecD dst, vecD src1, vecD src2) %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9680
  predicate(VM_Version::supports_vnni() && UseAVX > 2 && n->as_Vector()->length() == 2);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9681
  match(Set dst (AddVI (MulAddVS2VI src1 src2) dst));
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9682
  format %{ "evpdpwssd $dst,$src1,$src2\t! muladdadd packed4Sto2I" %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9683
  ins_encode %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9684
    int vector_len = 0;
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9685
    __ evpdpwssd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9686
  %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9687
  ins_pipe( pipe_slow );
53336
36ca868f266f 8216050: Superword optimization fails with assert(0 <= i && i < _len) failed: illegal index
vdeshpande
parents: 53171
diff changeset
  9688
  ins_cost(10);
52992
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9689
%}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9690
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9691
instruct vmuladdadd8S4I_reg(vecX dst, vecX src1, vecX src2) %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9692
  predicate(VM_Version::supports_vnni() && UseAVX > 2 && n->as_Vector()->length() == 4);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9693
  match(Set dst (AddVI (MulAddVS2VI src1 src2) dst));
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9694
  format %{ "evpdpwssd $dst,$src1,$src2\t! muladdadd packed8Sto4I" %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9695
  ins_encode %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9696
    int vector_len = 0;
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9697
    __ evpdpwssd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9698
  %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9699
  ins_pipe( pipe_slow );
53336
36ca868f266f 8216050: Superword optimization fails with assert(0 <= i && i < _len) failed: illegal index
vdeshpande
parents: 53171
diff changeset
  9700
  ins_cost(10);
52992
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9701
%}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9702
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9703
instruct vmuladdadd16S8I_reg(vecY dst, vecY src1, vecY src2) %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9704
  predicate(VM_Version::supports_vnni() && UseAVX > 2 && n->as_Vector()->length() == 8);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9705
  match(Set dst (AddVI (MulAddVS2VI src1 src2) dst));
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9706
  format %{ "evpdpwssd $dst,$src1,$src2\t! muladdadd packed16Sto8I" %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9707
  ins_encode %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9708
    int vector_len = 1;
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9709
    __ evpdpwssd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9710
  %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9711
  ins_pipe( pipe_slow );
53336
36ca868f266f 8216050: Superword optimization fails with assert(0 <= i && i < _len) failed: illegal index
vdeshpande
parents: 53171
diff changeset
  9712
  ins_cost(10);
52992
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9713
%}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9714
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9715
instruct vmuladdadd32S16I_reg(vecZ dst, vecZ src1, vecZ src2) %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9716
  predicate(VM_Version::supports_vnni() && UseAVX > 2 && n->as_Vector()->length() == 16);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9717
  match(Set dst (AddVI (MulAddVS2VI src1 src2) dst));
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9718
  format %{ "evpdpwssd $dst,$src1,$src2\t! muladdadd packed32Sto16I" %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9719
  ins_encode %{
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9720
    int vector_len = 2;
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9721
    __ evpdpwssd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9722
  %}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9723
  ins_pipe( pipe_slow );
53336
36ca868f266f 8216050: Superword optimization fails with assert(0 <= i && i < _len) failed: illegal index
vdeshpande
parents: 53171
diff changeset
  9724
  ins_cost(10);
52992
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9725
%}
4bb6e0871bf7 8214751: X86: Support for VNNI Instructions
vdeshpande
parents: 51996
diff changeset
  9726
49384
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9727
// --------------------------------- PopCount --------------------------------------
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9728
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9729
instruct vpopcount2I(vecD dst, vecD src) %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9730
  predicate(VM_Version::supports_vpopcntdq() && UsePopCountInstruction && n->as_Vector()->length() == 2);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9731
  match(Set dst (PopCountVI src));
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9732
  format %{ "vpopcntd  $dst,$src\t! vector popcount packed2I" %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9733
  ins_encode %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9734
    int vector_len = 0;
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9735
    __ vpopcntd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9736
  %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9737
  ins_pipe( pipe_slow );
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9738
%}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9739
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9740
instruct vpopcount4I(vecX dst, vecX src) %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9741
  predicate(VM_Version::supports_vpopcntdq() && UsePopCountInstruction && n->as_Vector()->length() == 4);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9742
  match(Set dst (PopCountVI src));
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9743
  format %{ "vpopcntd  $dst,$src\t! vector popcount packed4I" %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9744
  ins_encode %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9745
    int vector_len = 0;
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9746
    __ vpopcntd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9747
  %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9748
  ins_pipe( pipe_slow );
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9749
%}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9750
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9751
instruct vpopcount8I(vecY dst, vecY src) %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9752
  predicate(VM_Version::supports_vpopcntdq() && UsePopCountInstruction && n->as_Vector()->length() == 8);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9753
  match(Set dst (PopCountVI src));
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9754
  format %{ "vpopcntd  $dst,$src\t! vector popcount packed8I" %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9755
  ins_encode %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9756
    int vector_len = 1;
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9757
    __ vpopcntd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9758
  %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9759
  ins_pipe( pipe_slow );
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9760
%}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9761
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9762
instruct vpopcount16I(vecZ dst, vecZ src) %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9763
  predicate(VM_Version::supports_vpopcntdq() && UsePopCountInstruction && n->as_Vector()->length() == 16);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9764
  match(Set dst (PopCountVI src));
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9765
  format %{ "vpopcntd  $dst,$src\t! vector popcount packed16I" %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9766
  ins_encode %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9767
    int vector_len = 2;
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9768
    __ vpopcntd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9769
  %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9770
  ins_pipe( pipe_slow );
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  9771
%}