src/hotspot/cpu/x86/x86.ad
author goetz
Thu, 12 Jul 2018 16:31:28 +0200
changeset 51078 fc6cfe40e32a
parent 50525 767cdb97f103
child 51633 21154cb84d2a
permissions -rw-r--r--
8207049: Minor improvements of compiler code. Reviewed-by: kvn, mdoerr
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     1
//
51078
fc6cfe40e32a 8207049: Minor improvements of compiler code.
goetz
parents: 50525
diff changeset
     2
// Copyright (c) 2011, 2018, Oracle and/or its affiliates. All rights reserved.
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     3
// DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     4
//
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     5
// This code is free software; you can redistribute it and/or modify it
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     6
// under the terms of the GNU General Public License version 2 only, as
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     7
// published by the Free Software Foundation.
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     8
//
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
     9
// This code is distributed in the hope that it will be useful, but WITHOUT
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    10
// ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    11
// FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    12
// version 2 for more details (a copy is included in the LICENSE file that
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    13
// accompanied this code).
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    14
//
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    15
// You should have received a copy of the GNU General Public License version
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    16
// 2 along with this work; if not, write to the Free Software Foundation,
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    17
// Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    18
//
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    19
// Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    20
// or visit www.oracle.com if you need additional information or have any
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    21
// questions.
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    22
//
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    23
//
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    24
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    25
// X86 Common Architecture Description File
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
    26
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    27
//----------REGISTER DEFINITION BLOCK------------------------------------------
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    28
// This information is used by the matcher and the register allocator to
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    29
// describe individual registers and classes of registers within the target
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    30
// archtecture.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    31
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    32
register %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    33
//----------Architecture Description Register Definitions----------------------
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    34
// General Registers
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    35
// "reg_def"  name ( register save type, C convention save type,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    36
//                   ideal register type, encoding );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    37
// Register Save Types:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    38
//
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    39
// NS  = No-Save:       The register allocator assumes that these registers
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    40
//                      can be used without saving upon entry to the method, &
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    41
//                      that they do not need to be saved at call sites.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    42
//
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    43
// SOC = Save-On-Call:  The register allocator assumes that these registers
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    44
//                      can be used without saving upon entry to the method,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    45
//                      but that they must be saved at call sites.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    46
//
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    47
// SOE = Save-On-Entry: The register allocator assumes that these registers
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    48
//                      must be saved before using them upon entry to the
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    49
//                      method, but they do not need to be saved at call
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    50
//                      sites.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    51
//
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    52
// AS  = Always-Save:   The register allocator assumes that these registers
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    53
//                      must be saved before using them upon entry to the
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    54
//                      method, & that they must be saved at call sites.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    55
//
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    56
// Ideal Register Type is used to determine how to save & restore a
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    57
// register.  Op_RegI will get spilled with LoadI/StoreI, Op_RegP will get
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    58
// spilled with LoadP/StoreP.  If the register supports both, use Op_RegI.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    59
//
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    60
// The encoding number is the actual bit-pattern placed into the opcodes.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    61
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    62
// XMM registers.  512-bit registers or 8 words each, labeled (a)-p.
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    63
// Word a in each register holds a Float, words ab hold a Double.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    64
// The whole registers are used in SSE4.2 version intrinsics,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    65
// array copy stubs and superword operations (see UseSSE42Intrinsics,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    66
// UseXMMForArrayCopy and UseSuperword flags).
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    67
// For pre EVEX enabled architectures:
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    68
//      XMM8-XMM15 must be encoded with REX (VEX for UseAVX)
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    69
// For EVEX enabled architectures:
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    70
//      XMM8-XMM31 must be encoded with REX (EVEX for UseAVX).
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    71
//
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    72
// Linux ABI:   No register preserved across function calls
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    73
//              XMM0-XMM7 might hold parameters
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    74
// Windows ABI: XMM6-XMM31 preserved across function calls
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    75
//              XMM0-XMM3 might hold parameters
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    76
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    77
reg_def XMM0 ( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    78
reg_def XMM0b( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    79
reg_def XMM0c( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    80
reg_def XMM0d( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    81
reg_def XMM0e( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    82
reg_def XMM0f( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    83
reg_def XMM0g( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    84
reg_def XMM0h( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    85
reg_def XMM0i( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    86
reg_def XMM0j( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    87
reg_def XMM0k( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    88
reg_def XMM0l( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    89
reg_def XMM0m( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    90
reg_def XMM0n( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    91
reg_def XMM0o( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
    92
reg_def XMM0p( SOC, SOC, Op_RegF, 0, xmm0->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    93
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
    94
reg_def XMM1 ( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    95
reg_def XMM1b( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    96
reg_def XMM1c( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    97
reg_def XMM1d( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    98
reg_def XMM1e( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
    99
reg_def XMM1f( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   100
reg_def XMM1g( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   101
reg_def XMM1h( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   102
reg_def XMM1i( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   103
reg_def XMM1j( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   104
reg_def XMM1k( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   105
reg_def XMM1l( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   106
reg_def XMM1m( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   107
reg_def XMM1n( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   108
reg_def XMM1o( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   109
reg_def XMM1p( SOC, SOC, Op_RegF, 1, xmm1->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   110
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   111
reg_def XMM2 ( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   112
reg_def XMM2b( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   113
reg_def XMM2c( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   114
reg_def XMM2d( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   115
reg_def XMM2e( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   116
reg_def XMM2f( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   117
reg_def XMM2g( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   118
reg_def XMM2h( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   119
reg_def XMM2i( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   120
reg_def XMM2j( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   121
reg_def XMM2k( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   122
reg_def XMM2l( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   123
reg_def XMM2m( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   124
reg_def XMM2n( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   125
reg_def XMM2o( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   126
reg_def XMM2p( SOC, SOC, Op_RegF, 2, xmm2->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   127
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   128
reg_def XMM3 ( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   129
reg_def XMM3b( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   130
reg_def XMM3c( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   131
reg_def XMM3d( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   132
reg_def XMM3e( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   133
reg_def XMM3f( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   134
reg_def XMM3g( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   135
reg_def XMM3h( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   136
reg_def XMM3i( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   137
reg_def XMM3j( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   138
reg_def XMM3k( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   139
reg_def XMM3l( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   140
reg_def XMM3m( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   141
reg_def XMM3n( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   142
reg_def XMM3o( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   143
reg_def XMM3p( SOC, SOC, Op_RegF, 3, xmm3->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   144
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   145
reg_def XMM4 ( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   146
reg_def XMM4b( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   147
reg_def XMM4c( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   148
reg_def XMM4d( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   149
reg_def XMM4e( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   150
reg_def XMM4f( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   151
reg_def XMM4g( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   152
reg_def XMM4h( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   153
reg_def XMM4i( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   154
reg_def XMM4j( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   155
reg_def XMM4k( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   156
reg_def XMM4l( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   157
reg_def XMM4m( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   158
reg_def XMM4n( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   159
reg_def XMM4o( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   160
reg_def XMM4p( SOC, SOC, Op_RegF, 4, xmm4->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   161
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   162
reg_def XMM5 ( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   163
reg_def XMM5b( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   164
reg_def XMM5c( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   165
reg_def XMM5d( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   166
reg_def XMM5e( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   167
reg_def XMM5f( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   168
reg_def XMM5g( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   169
reg_def XMM5h( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   170
reg_def XMM5i( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   171
reg_def XMM5j( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   172
reg_def XMM5k( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   173
reg_def XMM5l( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   174
reg_def XMM5m( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   175
reg_def XMM5n( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   176
reg_def XMM5o( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   177
reg_def XMM5p( SOC, SOC, Op_RegF, 5, xmm5->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   178
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   179
reg_def XMM6 ( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   180
reg_def XMM6b( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   181
reg_def XMM6c( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   182
reg_def XMM6d( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   183
reg_def XMM6e( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   184
reg_def XMM6f( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   185
reg_def XMM6g( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   186
reg_def XMM6h( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   187
reg_def XMM6i( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   188
reg_def XMM6j( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   189
reg_def XMM6k( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   190
reg_def XMM6l( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   191
reg_def XMM6m( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   192
reg_def XMM6n( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   193
reg_def XMM6o( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   194
reg_def XMM6p( SOC, SOC, Op_RegF, 6, xmm6->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   195
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   196
reg_def XMM7 ( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   197
reg_def XMM7b( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   198
reg_def XMM7c( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   199
reg_def XMM7d( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   200
reg_def XMM7e( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   201
reg_def XMM7f( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   202
reg_def XMM7g( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   203
reg_def XMM7h( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   204
reg_def XMM7i( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   205
reg_def XMM7j( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   206
reg_def XMM7k( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   207
reg_def XMM7l( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   208
reg_def XMM7m( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   209
reg_def XMM7n( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   210
reg_def XMM7o( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   211
reg_def XMM7p( SOC, SOC, Op_RegF, 7, xmm7->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   212
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   213
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   214
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   215
reg_def XMM8 ( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   216
reg_def XMM8b( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   217
reg_def XMM8c( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   218
reg_def XMM8d( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   219
reg_def XMM8e( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   220
reg_def XMM8f( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   221
reg_def XMM8g( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   222
reg_def XMM8h( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   223
reg_def XMM8i( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   224
reg_def XMM8j( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   225
reg_def XMM8k( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   226
reg_def XMM8l( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   227
reg_def XMM8m( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   228
reg_def XMM8n( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   229
reg_def XMM8o( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   230
reg_def XMM8p( SOC, SOC, Op_RegF, 8, xmm8->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   231
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   232
reg_def XMM9 ( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   233
reg_def XMM9b( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   234
reg_def XMM9c( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   235
reg_def XMM9d( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   236
reg_def XMM9e( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   237
reg_def XMM9f( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   238
reg_def XMM9g( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   239
reg_def XMM9h( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   240
reg_def XMM9i( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   241
reg_def XMM9j( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   242
reg_def XMM9k( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   243
reg_def XMM9l( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   244
reg_def XMM9m( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   245
reg_def XMM9n( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   246
reg_def XMM9o( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   247
reg_def XMM9p( SOC, SOC, Op_RegF, 9, xmm9->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   248
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   249
reg_def XMM10 ( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   250
reg_def XMM10b( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   251
reg_def XMM10c( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   252
reg_def XMM10d( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   253
reg_def XMM10e( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   254
reg_def XMM10f( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   255
reg_def XMM10g( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   256
reg_def XMM10h( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   257
reg_def XMM10i( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   258
reg_def XMM10j( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   259
reg_def XMM10k( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   260
reg_def XMM10l( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   261
reg_def XMM10m( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   262
reg_def XMM10n( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   263
reg_def XMM10o( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   264
reg_def XMM10p( SOC, SOC, Op_RegF, 10, xmm10->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   265
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   266
reg_def XMM11 ( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   267
reg_def XMM11b( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   268
reg_def XMM11c( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   269
reg_def XMM11d( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   270
reg_def XMM11e( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   271
reg_def XMM11f( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   272
reg_def XMM11g( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   273
reg_def XMM11h( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   274
reg_def XMM11i( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   275
reg_def XMM11j( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   276
reg_def XMM11k( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   277
reg_def XMM11l( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   278
reg_def XMM11m( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   279
reg_def XMM11n( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   280
reg_def XMM11o( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   281
reg_def XMM11p( SOC, SOC, Op_RegF, 11, xmm11->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   282
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   283
reg_def XMM12 ( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   284
reg_def XMM12b( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   285
reg_def XMM12c( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   286
reg_def XMM12d( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   287
reg_def XMM12e( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   288
reg_def XMM12f( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   289
reg_def XMM12g( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   290
reg_def XMM12h( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   291
reg_def XMM12i( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   292
reg_def XMM12j( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   293
reg_def XMM12k( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   294
reg_def XMM12l( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   295
reg_def XMM12m( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   296
reg_def XMM12n( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   297
reg_def XMM12o( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   298
reg_def XMM12p( SOC, SOC, Op_RegF, 12, xmm12->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   299
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   300
reg_def XMM13 ( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   301
reg_def XMM13b( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   302
reg_def XMM13c( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   303
reg_def XMM13d( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   304
reg_def XMM13e( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   305
reg_def XMM13f( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   306
reg_def XMM13g( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   307
reg_def XMM13h( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   308
reg_def XMM13i( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   309
reg_def XMM13j( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   310
reg_def XMM13k( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   311
reg_def XMM13l( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   312
reg_def XMM13m( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   313
reg_def XMM13n( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   314
reg_def XMM13o( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   315
reg_def XMM13p( SOC, SOC, Op_RegF, 13, xmm13->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   316
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   317
reg_def XMM14 ( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   318
reg_def XMM14b( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   319
reg_def XMM14c( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   320
reg_def XMM14d( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   321
reg_def XMM14e( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   322
reg_def XMM14f( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   323
reg_def XMM14g( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   324
reg_def XMM14h( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   325
reg_def XMM14i( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   326
reg_def XMM14j( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   327
reg_def XMM14k( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   328
reg_def XMM14l( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   329
reg_def XMM14m( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   330
reg_def XMM14n( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   331
reg_def XMM14o( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   332
reg_def XMM14p( SOC, SOC, Op_RegF, 14, xmm14->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   333
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   334
reg_def XMM15 ( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg());
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   335
reg_def XMM15b( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(1));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   336
reg_def XMM15c( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(2));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   337
reg_def XMM15d( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(3));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   338
reg_def XMM15e( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(4));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   339
reg_def XMM15f( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(5));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   340
reg_def XMM15g( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(6));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
   341
reg_def XMM15h( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(7));
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   342
reg_def XMM15i( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   343
reg_def XMM15j( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   344
reg_def XMM15k( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   345
reg_def XMM15l( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   346
reg_def XMM15m( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   347
reg_def XMM15n( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   348
reg_def XMM15o( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   349
reg_def XMM15p( SOC, SOC, Op_RegF, 15, xmm15->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   350
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   351
reg_def XMM16 ( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   352
reg_def XMM16b( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   353
reg_def XMM16c( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   354
reg_def XMM16d( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   355
reg_def XMM16e( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   356
reg_def XMM16f( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   357
reg_def XMM16g( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   358
reg_def XMM16h( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   359
reg_def XMM16i( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   360
reg_def XMM16j( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   361
reg_def XMM16k( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   362
reg_def XMM16l( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   363
reg_def XMM16m( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   364
reg_def XMM16n( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   365
reg_def XMM16o( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   366
reg_def XMM16p( SOC, SOC, Op_RegF, 16, xmm16->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   367
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   368
reg_def XMM17 ( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   369
reg_def XMM17b( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   370
reg_def XMM17c( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   371
reg_def XMM17d( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   372
reg_def XMM17e( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   373
reg_def XMM17f( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   374
reg_def XMM17g( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   375
reg_def XMM17h( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   376
reg_def XMM17i( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   377
reg_def XMM17j( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   378
reg_def XMM17k( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   379
reg_def XMM17l( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   380
reg_def XMM17m( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   381
reg_def XMM17n( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   382
reg_def XMM17o( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   383
reg_def XMM17p( SOC, SOC, Op_RegF, 17, xmm17->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   384
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   385
reg_def XMM18 ( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   386
reg_def XMM18b( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   387
reg_def XMM18c( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   388
reg_def XMM18d( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   389
reg_def XMM18e( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   390
reg_def XMM18f( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   391
reg_def XMM18g( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   392
reg_def XMM18h( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   393
reg_def XMM18i( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   394
reg_def XMM18j( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   395
reg_def XMM18k( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   396
reg_def XMM18l( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   397
reg_def XMM18m( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   398
reg_def XMM18n( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   399
reg_def XMM18o( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   400
reg_def XMM18p( SOC, SOC, Op_RegF, 18, xmm18->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   401
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   402
reg_def XMM19 ( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   403
reg_def XMM19b( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   404
reg_def XMM19c( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   405
reg_def XMM19d( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   406
reg_def XMM19e( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   407
reg_def XMM19f( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   408
reg_def XMM19g( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   409
reg_def XMM19h( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   410
reg_def XMM19i( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   411
reg_def XMM19j( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   412
reg_def XMM19k( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   413
reg_def XMM19l( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   414
reg_def XMM19m( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   415
reg_def XMM19n( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   416
reg_def XMM19o( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   417
reg_def XMM19p( SOC, SOC, Op_RegF, 19, xmm19->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   418
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   419
reg_def XMM20 ( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   420
reg_def XMM20b( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   421
reg_def XMM20c( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   422
reg_def XMM20d( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   423
reg_def XMM20e( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   424
reg_def XMM20f( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   425
reg_def XMM20g( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   426
reg_def XMM20h( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   427
reg_def XMM20i( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   428
reg_def XMM20j( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   429
reg_def XMM20k( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   430
reg_def XMM20l( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   431
reg_def XMM20m( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   432
reg_def XMM20n( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   433
reg_def XMM20o( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   434
reg_def XMM20p( SOC, SOC, Op_RegF, 20, xmm20->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   435
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   436
reg_def XMM21 ( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   437
reg_def XMM21b( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   438
reg_def XMM21c( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   439
reg_def XMM21d( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   440
reg_def XMM21e( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   441
reg_def XMM21f( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   442
reg_def XMM21g( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   443
reg_def XMM21h( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   444
reg_def XMM21i( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   445
reg_def XMM21j( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   446
reg_def XMM21k( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   447
reg_def XMM21l( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   448
reg_def XMM21m( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   449
reg_def XMM21n( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   450
reg_def XMM21o( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   451
reg_def XMM21p( SOC, SOC, Op_RegF, 21, xmm21->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   452
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   453
reg_def XMM22 ( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   454
reg_def XMM22b( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   455
reg_def XMM22c( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   456
reg_def XMM22d( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   457
reg_def XMM22e( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   458
reg_def XMM22f( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   459
reg_def XMM22g( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   460
reg_def XMM22h( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   461
reg_def XMM22i( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   462
reg_def XMM22j( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   463
reg_def XMM22k( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   464
reg_def XMM22l( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   465
reg_def XMM22m( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   466
reg_def XMM22n( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   467
reg_def XMM22o( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   468
reg_def XMM22p( SOC, SOC, Op_RegF, 22, xmm22->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   469
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   470
reg_def XMM23 ( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   471
reg_def XMM23b( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   472
reg_def XMM23c( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   473
reg_def XMM23d( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   474
reg_def XMM23e( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   475
reg_def XMM23f( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   476
reg_def XMM23g( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   477
reg_def XMM23h( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   478
reg_def XMM23i( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   479
reg_def XMM23j( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   480
reg_def XMM23k( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   481
reg_def XMM23l( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   482
reg_def XMM23m( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   483
reg_def XMM23n( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   484
reg_def XMM23o( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   485
reg_def XMM23p( SOC, SOC, Op_RegF, 23, xmm23->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   486
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   487
reg_def XMM24 ( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   488
reg_def XMM24b( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   489
reg_def XMM24c( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   490
reg_def XMM24d( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   491
reg_def XMM24e( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   492
reg_def XMM24f( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   493
reg_def XMM24g( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   494
reg_def XMM24h( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   495
reg_def XMM24i( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   496
reg_def XMM24j( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   497
reg_def XMM24k( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   498
reg_def XMM24l( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   499
reg_def XMM24m( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   500
reg_def XMM24n( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   501
reg_def XMM24o( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   502
reg_def XMM24p( SOC, SOC, Op_RegF, 24, xmm24->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   503
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   504
reg_def XMM25 ( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   505
reg_def XMM25b( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   506
reg_def XMM25c( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   507
reg_def XMM25d( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   508
reg_def XMM25e( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   509
reg_def XMM25f( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   510
reg_def XMM25g( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   511
reg_def XMM25h( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   512
reg_def XMM25i( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   513
reg_def XMM25j( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   514
reg_def XMM25k( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   515
reg_def XMM25l( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   516
reg_def XMM25m( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   517
reg_def XMM25n( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   518
reg_def XMM25o( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   519
reg_def XMM25p( SOC, SOC, Op_RegF, 25, xmm25->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   520
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   521
reg_def XMM26 ( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   522
reg_def XMM26b( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   523
reg_def XMM26c( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   524
reg_def XMM26d( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   525
reg_def XMM26e( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   526
reg_def XMM26f( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   527
reg_def XMM26g( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   528
reg_def XMM26h( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   529
reg_def XMM26i( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   530
reg_def XMM26j( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   531
reg_def XMM26k( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   532
reg_def XMM26l( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   533
reg_def XMM26m( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   534
reg_def XMM26n( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   535
reg_def XMM26o( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   536
reg_def XMM26p( SOC, SOC, Op_RegF, 26, xmm26->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   537
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   538
reg_def XMM27 ( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   539
reg_def XMM27b( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   540
reg_def XMM27c( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   541
reg_def XMM27d( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   542
reg_def XMM27e( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   543
reg_def XMM27f( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   544
reg_def XMM27g( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   545
reg_def XMM27h( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   546
reg_def XMM27i( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   547
reg_def XMM27j( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   548
reg_def XMM27k( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   549
reg_def XMM27l( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   550
reg_def XMM27m( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   551
reg_def XMM27n( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   552
reg_def XMM27o( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   553
reg_def XMM27p( SOC, SOC, Op_RegF, 27, xmm27->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   554
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   555
reg_def XMM28 ( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   556
reg_def XMM28b( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   557
reg_def XMM28c( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   558
reg_def XMM28d( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   559
reg_def XMM28e( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   560
reg_def XMM28f( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   561
reg_def XMM28g( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   562
reg_def XMM28h( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   563
reg_def XMM28i( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   564
reg_def XMM28j( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   565
reg_def XMM28k( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   566
reg_def XMM28l( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   567
reg_def XMM28m( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   568
reg_def XMM28n( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   569
reg_def XMM28o( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   570
reg_def XMM28p( SOC, SOC, Op_RegF, 28, xmm28->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   571
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   572
reg_def XMM29 ( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   573
reg_def XMM29b( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   574
reg_def XMM29c( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   575
reg_def XMM29d( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   576
reg_def XMM29e( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   577
reg_def XMM29f( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   578
reg_def XMM29g( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   579
reg_def XMM29h( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   580
reg_def XMM29i( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   581
reg_def XMM29j( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   582
reg_def XMM29k( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   583
reg_def XMM29l( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   584
reg_def XMM29m( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   585
reg_def XMM29n( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   586
reg_def XMM29o( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   587
reg_def XMM29p( SOC, SOC, Op_RegF, 29, xmm29->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   588
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   589
reg_def XMM30 ( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   590
reg_def XMM30b( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   591
reg_def XMM30c( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   592
reg_def XMM30d( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   593
reg_def XMM30e( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   594
reg_def XMM30f( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   595
reg_def XMM30g( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   596
reg_def XMM30h( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   597
reg_def XMM30i( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   598
reg_def XMM30j( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   599
reg_def XMM30k( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   600
reg_def XMM30l( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   601
reg_def XMM30m( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   602
reg_def XMM30n( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   603
reg_def XMM30o( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   604
reg_def XMM30p( SOC, SOC, Op_RegF, 30, xmm30->as_VMReg()->next(15));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   605
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   606
reg_def XMM31 ( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   607
reg_def XMM31b( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(1));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   608
reg_def XMM31c( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   609
reg_def XMM31d( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(3));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   610
reg_def XMM31e( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   611
reg_def XMM31f( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(5));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   612
reg_def XMM31g( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(6));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   613
reg_def XMM31h( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(7));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   614
reg_def XMM31i( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(8));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   615
reg_def XMM31j( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(9));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   616
reg_def XMM31k( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(10));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   617
reg_def XMM31l( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(11));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   618
reg_def XMM31m( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(12));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   619
reg_def XMM31n( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(13));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   620
reg_def XMM31o( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(14));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   621
reg_def XMM31p( SOC, SOC, Op_RegF, 31, xmm31->as_VMReg()->next(15));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   622
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   623
#endif // _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   624
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   625
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   626
reg_def RFLAGS(SOC, SOC, 0, 16, VMRegImpl::Bad());
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   627
#else
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   628
reg_def RFLAGS(SOC, SOC, 0, 8, VMRegImpl::Bad());
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   629
#endif // _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   630
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   631
alloc_class chunk1(XMM0,  XMM0b,  XMM0c,  XMM0d,  XMM0e,  XMM0f,  XMM0g,  XMM0h,  XMM0i,  XMM0j,  XMM0k,  XMM0l,  XMM0m,  XMM0n,  XMM0o,  XMM0p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   632
                   XMM1,  XMM1b,  XMM1c,  XMM1d,  XMM1e,  XMM1f,  XMM1g,  XMM1h,  XMM1i,  XMM1j,  XMM1k,  XMM1l,  XMM1m,  XMM1n,  XMM1o,  XMM1p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   633
                   XMM2,  XMM2b,  XMM2c,  XMM2d,  XMM2e,  XMM2f,  XMM2g,  XMM2h,  XMM2i,  XMM2j,  XMM2k,  XMM2l,  XMM2m,  XMM2n,  XMM2o,  XMM2p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   634
                   XMM3,  XMM3b,  XMM3c,  XMM3d,  XMM3e,  XMM3f,  XMM3g,  XMM3h,  XMM3i,  XMM3j,  XMM3k,  XMM3l,  XMM3m,  XMM3n,  XMM3o,  XMM3p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   635
                   XMM4,  XMM4b,  XMM4c,  XMM4d,  XMM4e,  XMM4f,  XMM4g,  XMM4h,  XMM4i,  XMM4j,  XMM4k,  XMM4l,  XMM4m,  XMM4n,  XMM4o,  XMM4p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   636
                   XMM5,  XMM5b,  XMM5c,  XMM5d,  XMM5e,  XMM5f,  XMM5g,  XMM5h,  XMM5i,  XMM5j,  XMM5k,  XMM5l,  XMM5m,  XMM5n,  XMM5o,  XMM5p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   637
                   XMM6,  XMM6b,  XMM6c,  XMM6d,  XMM6e,  XMM6f,  XMM6g,  XMM6h,  XMM6i,  XMM6j,  XMM6k,  XMM6l,  XMM6m,  XMM6n,  XMM6o,  XMM6p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   638
                   XMM7,  XMM7b,  XMM7c,  XMM7d,  XMM7e,  XMM7f,  XMM7g,  XMM7h,  XMM7i,  XMM7j,  XMM7k,  XMM7l,  XMM7m,  XMM7n,  XMM7o,  XMM7p
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   639
#ifdef _LP64
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   640
                  ,XMM8,  XMM8b,  XMM8c,  XMM8d,  XMM8e,  XMM8f,  XMM8g,  XMM8h,  XMM8i,  XMM8j,  XMM8k,  XMM8l,  XMM8m,  XMM8n,  XMM8o,  XMM8p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   641
                   XMM9,  XMM9b,  XMM9c,  XMM9d,  XMM9e,  XMM9f,  XMM9g,  XMM9h,  XMM9i,  XMM9j,  XMM9k,  XMM9l,  XMM9m,  XMM9n,  XMM9o,  XMM9p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   642
                   XMM10, XMM10b, XMM10c, XMM10d, XMM10e, XMM10f, XMM10g, XMM10h, XMM10i, XMM10j, XMM10k, XMM10l, XMM10m, XMM10n, XMM10o, XMM10p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   643
                   XMM11, XMM11b, XMM11c, XMM11d, XMM11e, XMM11f, XMM11g, XMM11h, XMM11i, XMM11j, XMM11k, XMM11l, XMM11m, XMM11n, XMM11o, XMM11p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   644
                   XMM12, XMM12b, XMM12c, XMM12d, XMM12e, XMM12f, XMM12g, XMM12h, XMM12i, XMM12j, XMM12k, XMM12l, XMM12m, XMM12n, XMM12o, XMM12p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   645
                   XMM13, XMM13b, XMM13c, XMM13d, XMM13e, XMM13f, XMM13g, XMM13h, XMM13i, XMM13j, XMM13k, XMM13l, XMM13m, XMM13n, XMM13o, XMM13p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   646
                   XMM14, XMM14b, XMM14c, XMM14d, XMM14e, XMM14f, XMM14g, XMM14h, XMM14i, XMM14j, XMM14k, XMM14l, XMM14m, XMM14n, XMM14o, XMM14p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   647
                   XMM15, XMM15b, XMM15c, XMM15d, XMM15e, XMM15f, XMM15g, XMM15h, XMM15i, XMM15j, XMM15k, XMM15l, XMM15m, XMM15n, XMM15o, XMM15p
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   648
                  ,XMM16, XMM16b, XMM16c, XMM16d, XMM16e, XMM16f, XMM16g, XMM16h, XMM16i, XMM16j, XMM16k, XMM16l, XMM16m, XMM16n, XMM16o, XMM16p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   649
                   XMM17, XMM17b, XMM17c, XMM17d, XMM17e, XMM17f, XMM17g, XMM17h, XMM17i, XMM17j, XMM17k, XMM17l, XMM17m, XMM17n, XMM17o, XMM17p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   650
                   XMM18, XMM18b, XMM18c, XMM18d, XMM18e, XMM18f, XMM18g, XMM18h, XMM18i, XMM18j, XMM18k, XMM18l, XMM18m, XMM18n, XMM18o, XMM18p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   651
                   XMM19, XMM19b, XMM19c, XMM19d, XMM19e, XMM19f, XMM19g, XMM19h, XMM19i, XMM19j, XMM19k, XMM19l, XMM19m, XMM19n, XMM19o, XMM19p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   652
                   XMM20, XMM20b, XMM20c, XMM20d, XMM20e, XMM20f, XMM20g, XMM20h, XMM20i, XMM20j, XMM20k, XMM20l, XMM20m, XMM20n, XMM20o, XMM20p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   653
                   XMM21, XMM21b, XMM21c, XMM21d, XMM21e, XMM21f, XMM21g, XMM21h, XMM21i, XMM21j, XMM21k, XMM21l, XMM21m, XMM21n, XMM21o, XMM21p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   654
                   XMM22, XMM22b, XMM22c, XMM22d, XMM22e, XMM22f, XMM22g, XMM22h, XMM22i, XMM22j, XMM22k, XMM22l, XMM22m, XMM22n, XMM22o, XMM22p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   655
                   XMM23, XMM23b, XMM23c, XMM23d, XMM23e, XMM23f, XMM23g, XMM23h, XMM23i, XMM23j, XMM23k, XMM23l, XMM23m, XMM23n, XMM23o, XMM23p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   656
                   XMM24, XMM24b, XMM24c, XMM24d, XMM24e, XMM24f, XMM24g, XMM24h, XMM24i, XMM24j, XMM24k, XMM24l, XMM24m, XMM24n, XMM24o, XMM24p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   657
                   XMM25, XMM25b, XMM25c, XMM25d, XMM25e, XMM25f, XMM25g, XMM25h, XMM25i, XMM25j, XMM25k, XMM25l, XMM25m, XMM25n, XMM25o, XMM25p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   658
                   XMM26, XMM26b, XMM26c, XMM26d, XMM26e, XMM26f, XMM26g, XMM26h, XMM26i, XMM26j, XMM26k, XMM26l, XMM26m, XMM26n, XMM26o, XMM26p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   659
                   XMM27, XMM27b, XMM27c, XMM27d, XMM27e, XMM27f, XMM27g, XMM27h, XMM27i, XMM27j, XMM27k, XMM27l, XMM27m, XMM27n, XMM27o, XMM27p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   660
                   XMM28, XMM28b, XMM28c, XMM28d, XMM28e, XMM28f, XMM28g, XMM28h, XMM28i, XMM28j, XMM28k, XMM28l, XMM28m, XMM28n, XMM28o, XMM28p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   661
                   XMM29, XMM29b, XMM29c, XMM29d, XMM29e, XMM29f, XMM29g, XMM29h, XMM29i, XMM29j, XMM29k, XMM29l, XMM29m, XMM29n, XMM29o, XMM29p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   662
                   XMM30, XMM30b, XMM30c, XMM30d, XMM30e, XMM30f, XMM30g, XMM30h, XMM30i, XMM30j, XMM30k, XMM30l, XMM30m, XMM30n, XMM30o, XMM30p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   663
                   XMM31, XMM31b, XMM31c, XMM31d, XMM31e, XMM31f, XMM31g, XMM31h, XMM31i, XMM31j, XMM31k, XMM31l, XMM31m, XMM31n, XMM31o, XMM31p
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   664
#endif
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   665
                      );
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   666
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   667
// flags allocation class should be last.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   668
alloc_class chunk2(RFLAGS);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   669
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   670
// Singleton class for condition codes
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   671
reg_class int_flags(RFLAGS);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   672
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   673
// Class for pre evex float registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   674
reg_class float_reg_legacy(XMM0,
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   675
                    XMM1,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   676
                    XMM2,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   677
                    XMM3,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   678
                    XMM4,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   679
                    XMM5,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   680
                    XMM6,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   681
                    XMM7
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   682
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   683
                   ,XMM8,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   684
                    XMM9,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   685
                    XMM10,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   686
                    XMM11,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   687
                    XMM12,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   688
                    XMM13,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   689
                    XMM14,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   690
                    XMM15
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   691
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   692
                    );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   693
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   694
// Class for evex float registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   695
reg_class float_reg_evex(XMM0,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   696
                    XMM1,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   697
                    XMM2,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   698
                    XMM3,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   699
                    XMM4,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   700
                    XMM5,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   701
                    XMM6,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   702
                    XMM7
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   703
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   704
                   ,XMM8,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   705
                    XMM9,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   706
                    XMM10,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   707
                    XMM11,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   708
                    XMM12,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   709
                    XMM13,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   710
                    XMM14,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   711
                    XMM15,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   712
                    XMM16,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   713
                    XMM17,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   714
                    XMM18,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   715
                    XMM19,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   716
                    XMM20,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   717
                    XMM21,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   718
                    XMM22,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   719
                    XMM23,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   720
                    XMM24,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   721
                    XMM25,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   722
                    XMM26,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   723
                    XMM27,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   724
                    XMM28,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   725
                    XMM29,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   726
                    XMM30,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   727
                    XMM31
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   728
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   729
                    );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   730
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   731
reg_class_dynamic float_reg(float_reg_evex, float_reg_legacy, %{ VM_Version::supports_evex() %} );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   732
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   733
// Class for pre evex double registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   734
reg_class double_reg_legacy(XMM0,  XMM0b,
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   735
                     XMM1,  XMM1b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   736
                     XMM2,  XMM2b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   737
                     XMM3,  XMM3b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   738
                     XMM4,  XMM4b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   739
                     XMM5,  XMM5b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   740
                     XMM6,  XMM6b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   741
                     XMM7,  XMM7b
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   742
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   743
                    ,XMM8,  XMM8b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   744
                     XMM9,  XMM9b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   745
                     XMM10, XMM10b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   746
                     XMM11, XMM11b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   747
                     XMM12, XMM12b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   748
                     XMM13, XMM13b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   749
                     XMM14, XMM14b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   750
                     XMM15, XMM15b
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   751
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   752
                     );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   753
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   754
// Class for evex double registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   755
reg_class double_reg_evex(XMM0,  XMM0b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   756
                     XMM1,  XMM1b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   757
                     XMM2,  XMM2b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   758
                     XMM3,  XMM3b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   759
                     XMM4,  XMM4b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   760
                     XMM5,  XMM5b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   761
                     XMM6,  XMM6b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   762
                     XMM7,  XMM7b
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   763
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   764
                    ,XMM8,  XMM8b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   765
                     XMM9,  XMM9b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   766
                     XMM10, XMM10b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   767
                     XMM11, XMM11b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   768
                     XMM12, XMM12b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   769
                     XMM13, XMM13b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   770
                     XMM14, XMM14b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   771
                     XMM15, XMM15b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   772
                     XMM16, XMM16b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   773
                     XMM17, XMM17b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   774
                     XMM18, XMM18b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   775
                     XMM19, XMM19b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   776
                     XMM20, XMM20b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   777
                     XMM21, XMM21b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   778
                     XMM22, XMM22b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   779
                     XMM23, XMM23b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   780
                     XMM24, XMM24b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   781
                     XMM25, XMM25b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   782
                     XMM26, XMM26b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   783
                     XMM27, XMM27b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   784
                     XMM28, XMM28b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   785
                     XMM29, XMM29b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   786
                     XMM30, XMM30b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   787
                     XMM31, XMM31b
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   788
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   789
                     );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   790
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   791
reg_class_dynamic double_reg(double_reg_evex, double_reg_legacy, %{ VM_Version::supports_evex() %} );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   792
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   793
// Class for pre evex 32bit vector registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   794
reg_class vectors_reg_legacy(XMM0,
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   795
                      XMM1,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   796
                      XMM2,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   797
                      XMM3,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   798
                      XMM4,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   799
                      XMM5,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   800
                      XMM6,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   801
                      XMM7
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   802
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   803
                     ,XMM8,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   804
                      XMM9,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   805
                      XMM10,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   806
                      XMM11,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   807
                      XMM12,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   808
                      XMM13,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   809
                      XMM14,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   810
                      XMM15
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   811
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   812
                      );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   813
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   814
// Class for evex 32bit vector registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   815
reg_class vectors_reg_evex(XMM0,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   816
                      XMM1,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   817
                      XMM2,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   818
                      XMM3,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   819
                      XMM4,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   820
                      XMM5,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   821
                      XMM6,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   822
                      XMM7
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   823
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   824
                     ,XMM8,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   825
                      XMM9,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   826
                      XMM10,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   827
                      XMM11,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   828
                      XMM12,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   829
                      XMM13,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   830
                      XMM14,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   831
                      XMM15,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   832
                      XMM16,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   833
                      XMM17,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   834
                      XMM18,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   835
                      XMM19,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   836
                      XMM20,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   837
                      XMM21,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   838
                      XMM22,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   839
                      XMM23,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   840
                      XMM24,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   841
                      XMM25,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   842
                      XMM26,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   843
                      XMM27,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   844
                      XMM28,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   845
                      XMM29,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   846
                      XMM30,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   847
                      XMM31
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   848
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   849
                      );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   850
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   851
reg_class_dynamic vectors_reg(vectors_reg_evex, vectors_reg_legacy, %{ VM_Version::supports_evex() %} );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   852
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   853
// Class for all 64bit vector registers
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   854
reg_class vectord_reg_legacy(XMM0,  XMM0b,
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   855
                      XMM1,  XMM1b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   856
                      XMM2,  XMM2b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   857
                      XMM3,  XMM3b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   858
                      XMM4,  XMM4b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   859
                      XMM5,  XMM5b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   860
                      XMM6,  XMM6b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   861
                      XMM7,  XMM7b
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   862
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   863
                     ,XMM8,  XMM8b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   864
                      XMM9,  XMM9b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   865
                      XMM10, XMM10b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   866
                      XMM11, XMM11b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   867
                      XMM12, XMM12b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   868
                      XMM13, XMM13b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   869
                      XMM14, XMM14b,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   870
                      XMM15, XMM15b
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   871
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   872
                      );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   873
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   874
// Class for all 64bit vector registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   875
reg_class vectord_reg_evex(XMM0,  XMM0b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   876
                      XMM1,  XMM1b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   877
                      XMM2,  XMM2b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   878
                      XMM3,  XMM3b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   879
                      XMM4,  XMM4b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   880
                      XMM5,  XMM5b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   881
                      XMM6,  XMM6b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   882
                      XMM7,  XMM7b
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   883
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   884
                     ,XMM8,  XMM8b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   885
                      XMM9,  XMM9b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   886
                      XMM10, XMM10b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   887
                      XMM11, XMM11b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   888
                      XMM12, XMM12b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   889
                      XMM13, XMM13b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   890
                      XMM14, XMM14b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   891
                      XMM15, XMM15b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   892
                      XMM16, XMM16b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   893
                      XMM17, XMM17b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   894
                      XMM18, XMM18b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   895
                      XMM19, XMM19b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   896
                      XMM20, XMM20b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   897
                      XMM21, XMM21b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   898
                      XMM22, XMM22b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   899
                      XMM23, XMM23b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   900
                      XMM24, XMM24b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   901
                      XMM25, XMM25b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   902
                      XMM26, XMM26b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   903
                      XMM27, XMM27b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   904
                      XMM28, XMM28b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   905
                      XMM29, XMM29b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   906
                      XMM30, XMM30b,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   907
                      XMM31, XMM31b
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   908
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   909
                      );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   910
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   911
reg_class_dynamic vectord_reg(vectord_reg_evex, vectord_reg_legacy, %{ VM_Version::supports_evex() %} );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   912
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   913
// Class for all 128bit vector registers
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   914
reg_class vectorx_reg_legacy(XMM0,  XMM0b,  XMM0c,  XMM0d,
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   915
                      XMM1,  XMM1b,  XMM1c,  XMM1d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   916
                      XMM2,  XMM2b,  XMM2c,  XMM2d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   917
                      XMM3,  XMM3b,  XMM3c,  XMM3d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   918
                      XMM4,  XMM4b,  XMM4c,  XMM4d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   919
                      XMM5,  XMM5b,  XMM5c,  XMM5d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   920
                      XMM6,  XMM6b,  XMM6c,  XMM6d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   921
                      XMM7,  XMM7b,  XMM7c,  XMM7d
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   922
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   923
                     ,XMM8,  XMM8b,  XMM8c,  XMM8d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   924
                      XMM9,  XMM9b,  XMM9c,  XMM9d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   925
                      XMM10, XMM10b, XMM10c, XMM10d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   926
                      XMM11, XMM11b, XMM11c, XMM11d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   927
                      XMM12, XMM12b, XMM12c, XMM12d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   928
                      XMM13, XMM13b, XMM13c, XMM13d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   929
                      XMM14, XMM14b, XMM14c, XMM14d,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   930
                      XMM15, XMM15b, XMM15c, XMM15d
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   931
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   932
                      );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   933
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   934
// Class for all 128bit vector registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   935
reg_class vectorx_reg_evex(XMM0,  XMM0b,  XMM0c,  XMM0d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   936
                      XMM1,  XMM1b,  XMM1c,  XMM1d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   937
                      XMM2,  XMM2b,  XMM2c,  XMM2d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   938
                      XMM3,  XMM3b,  XMM3c,  XMM3d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   939
                      XMM4,  XMM4b,  XMM4c,  XMM4d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   940
                      XMM5,  XMM5b,  XMM5c,  XMM5d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   941
                      XMM6,  XMM6b,  XMM6c,  XMM6d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   942
                      XMM7,  XMM7b,  XMM7c,  XMM7d
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   943
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   944
                     ,XMM8,  XMM8b,  XMM8c,  XMM8d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   945
                      XMM9,  XMM9b,  XMM9c,  XMM9d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   946
                      XMM10, XMM10b, XMM10c, XMM10d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   947
                      XMM11, XMM11b, XMM11c, XMM11d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   948
                      XMM12, XMM12b, XMM12c, XMM12d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   949
                      XMM13, XMM13b, XMM13c, XMM13d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   950
                      XMM14, XMM14b, XMM14c, XMM14d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   951
                      XMM15, XMM15b, XMM15c, XMM15d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   952
                      XMM16, XMM16b, XMM16c, XMM16d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   953
                      XMM17, XMM17b, XMM17c, XMM17d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   954
                      XMM18, XMM18b, XMM18c, XMM18d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   955
                      XMM19, XMM19b, XMM19c, XMM19d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   956
                      XMM20, XMM20b, XMM20c, XMM20d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   957
                      XMM21, XMM21b, XMM21c, XMM21d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   958
                      XMM22, XMM22b, XMM22c, XMM22d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   959
                      XMM23, XMM23b, XMM23c, XMM23d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   960
                      XMM24, XMM24b, XMM24c, XMM24d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   961
                      XMM25, XMM25b, XMM25c, XMM25d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   962
                      XMM26, XMM26b, XMM26c, XMM26d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   963
                      XMM27, XMM27b, XMM27c, XMM27d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   964
                      XMM28, XMM28b, XMM28c, XMM28d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   965
                      XMM29, XMM29b, XMM29c, XMM29d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   966
                      XMM30, XMM30b, XMM30c, XMM30d,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   967
                      XMM31, XMM31b, XMM31c, XMM31d
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   968
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   969
                      );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   970
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   971
reg_class_dynamic vectorx_reg(vectorx_reg_evex, vectorx_reg_legacy, %{ VM_Version::supports_evex() %} );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   972
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   973
// Class for all 256bit vector registers
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   974
reg_class vectory_reg_legacy(XMM0,  XMM0b,  XMM0c,  XMM0d,  XMM0e,  XMM0f,  XMM0g,  XMM0h,
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   975
                      XMM1,  XMM1b,  XMM1c,  XMM1d,  XMM1e,  XMM1f,  XMM1g,  XMM1h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   976
                      XMM2,  XMM2b,  XMM2c,  XMM2d,  XMM2e,  XMM2f,  XMM2g,  XMM2h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   977
                      XMM3,  XMM3b,  XMM3c,  XMM3d,  XMM3e,  XMM3f,  XMM3g,  XMM3h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   978
                      XMM4,  XMM4b,  XMM4c,  XMM4d,  XMM4e,  XMM4f,  XMM4g,  XMM4h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   979
                      XMM5,  XMM5b,  XMM5c,  XMM5d,  XMM5e,  XMM5f,  XMM5g,  XMM5h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   980
                      XMM6,  XMM6b,  XMM6c,  XMM6d,  XMM6e,  XMM6f,  XMM6g,  XMM6h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   981
                      XMM7,  XMM7b,  XMM7c,  XMM7d,  XMM7e,  XMM7f,  XMM7g,  XMM7h
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   982
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   983
                     ,XMM8,  XMM8b,  XMM8c,  XMM8d,  XMM8e,  XMM8f,  XMM8g,  XMM8h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   984
                      XMM9,  XMM9b,  XMM9c,  XMM9d,  XMM9e,  XMM9f,  XMM9g,  XMM9h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   985
                      XMM10, XMM10b, XMM10c, XMM10d, XMM10e, XMM10f, XMM10g, XMM10h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   986
                      XMM11, XMM11b, XMM11c, XMM11d, XMM11e, XMM11f, XMM11g, XMM11h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   987
                      XMM12, XMM12b, XMM12c, XMM12d, XMM12e, XMM12f, XMM12g, XMM12h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   988
                      XMM13, XMM13b, XMM13c, XMM13d, XMM13e, XMM13f, XMM13g, XMM13h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   989
                      XMM14, XMM14b, XMM14c, XMM14d, XMM14e, XMM14f, XMM14g, XMM14h,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   990
                      XMM15, XMM15b, XMM15c, XMM15d, XMM15e, XMM15f, XMM15g, XMM15h
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   991
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   992
                      );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
   993
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   994
// Class for all 256bit vector registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   995
reg_class vectory_reg_evex(XMM0,  XMM0b,  XMM0c,  XMM0d,  XMM0e,  XMM0f,  XMM0g,  XMM0h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   996
                      XMM1,  XMM1b,  XMM1c,  XMM1d,  XMM1e,  XMM1f,  XMM1g,  XMM1h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   997
                      XMM2,  XMM2b,  XMM2c,  XMM2d,  XMM2e,  XMM2f,  XMM2g,  XMM2h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   998
                      XMM3,  XMM3b,  XMM3c,  XMM3d,  XMM3e,  XMM3f,  XMM3g,  XMM3h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
   999
                      XMM4,  XMM4b,  XMM4c,  XMM4d,  XMM4e,  XMM4f,  XMM4g,  XMM4h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1000
                      XMM5,  XMM5b,  XMM5c,  XMM5d,  XMM5e,  XMM5f,  XMM5g,  XMM5h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1001
                      XMM6,  XMM6b,  XMM6c,  XMM6d,  XMM6e,  XMM6f,  XMM6g,  XMM6h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1002
                      XMM7,  XMM7b,  XMM7c,  XMM7d,  XMM7e,  XMM7f,  XMM7g,  XMM7h
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1003
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1004
                     ,XMM8,  XMM8b,  XMM8c,  XMM8d,  XMM8e,  XMM8f,  XMM8g,  XMM8h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1005
                      XMM9,  XMM9b,  XMM9c,  XMM9d,  XMM9e,  XMM9f,  XMM9g,  XMM9h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1006
                      XMM10, XMM10b, XMM10c, XMM10d, XMM10e, XMM10f, XMM10g, XMM10h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1007
                      XMM11, XMM11b, XMM11c, XMM11d, XMM11e, XMM11f, XMM11g, XMM11h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1008
                      XMM12, XMM12b, XMM12c, XMM12d, XMM12e, XMM12f, XMM12g, XMM12h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1009
                      XMM13, XMM13b, XMM13c, XMM13d, XMM13e, XMM13f, XMM13g, XMM13h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1010
                      XMM14, XMM14b, XMM14c, XMM14d, XMM14e, XMM14f, XMM14g, XMM14h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1011
                      XMM15, XMM15b, XMM15c, XMM15d, XMM15e, XMM15f, XMM15g, XMM15h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1012
                      XMM16, XMM16b, XMM16c, XMM16d, XMM16e, XMM16f, XMM16g, XMM16h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1013
                      XMM17, XMM17b, XMM17c, XMM17d, XMM17e, XMM17f, XMM17g, XMM17h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1014
                      XMM18, XMM18b, XMM18c, XMM18d, XMM18e, XMM18f, XMM18g, XMM18h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1015
                      XMM19, XMM19b, XMM19c, XMM19d, XMM19e, XMM19f, XMM19g, XMM19h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1016
                      XMM20, XMM20b, XMM20c, XMM20d, XMM20e, XMM20f, XMM20g, XMM20h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1017
                      XMM21, XMM21b, XMM21c, XMM21d, XMM21e, XMM21f, XMM21g, XMM21h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1018
                      XMM22, XMM22b, XMM22c, XMM22d, XMM22e, XMM22f, XMM22g, XMM22h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1019
                      XMM23, XMM23b, XMM23c, XMM23d, XMM23e, XMM23f, XMM23g, XMM23h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1020
                      XMM24, XMM24b, XMM24c, XMM24d, XMM24e, XMM24f, XMM24g, XMM24h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1021
                      XMM25, XMM25b, XMM25c, XMM25d, XMM25e, XMM25f, XMM25g, XMM25h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1022
                      XMM26, XMM26b, XMM26c, XMM26d, XMM26e, XMM26f, XMM26g, XMM26h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1023
                      XMM27, XMM27b, XMM27c, XMM27d, XMM27e, XMM27f, XMM27g, XMM27h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1024
                      XMM28, XMM28b, XMM28c, XMM28d, XMM28e, XMM28f, XMM28g, XMM28h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1025
                      XMM29, XMM29b, XMM29c, XMM29d, XMM29e, XMM29f, XMM29g, XMM29h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1026
                      XMM30, XMM30b, XMM30c, XMM30d, XMM30e, XMM30f, XMM30g, XMM30h,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1027
                      XMM31, XMM31b, XMM31c, XMM31d, XMM31e, XMM31f, XMM31g, XMM31h
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1028
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1029
                      );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1030
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1031
reg_class_dynamic vectory_reg(vectory_reg_evex, vectory_reg_legacy, %{ VM_Version::supports_evex() %} );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1032
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1033
// Class for all 512bit vector registers
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1034
reg_class vectorz_reg(XMM0,  XMM0b,  XMM0c,  XMM0d,  XMM0e,  XMM0f,  XMM0g,  XMM0h,  XMM0i,  XMM0j,  XMM0k,  XMM0l,  XMM0m,  XMM0n,  XMM0o,  XMM0p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1035
                      XMM1,  XMM1b,  XMM1c,  XMM1d,  XMM1e,  XMM1f,  XMM1g,  XMM1h,  XMM1i,  XMM1j,  XMM1k,  XMM1l,  XMM1m,  XMM1n,  XMM1o,  XMM1p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1036
                      XMM2,  XMM2b,  XMM2c,  XMM2d,  XMM2e,  XMM2f,  XMM2g,  XMM2h,  XMM2i,  XMM2j,  XMM2k,  XMM2l,  XMM2m,  XMM2n,  XMM2o,  XMM2p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1037
                      XMM3,  XMM3b,  XMM3c,  XMM3d,  XMM3e,  XMM3f,  XMM3g,  XMM3h,  XMM3i,  XMM3j,  XMM3k,  XMM3l,  XMM3m,  XMM3n,  XMM3o,  XMM3p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1038
                      XMM4,  XMM4b,  XMM4c,  XMM4d,  XMM4e,  XMM4f,  XMM4g,  XMM4h,  XMM4i,  XMM4j,  XMM4k,  XMM4l,  XMM4m,  XMM4n,  XMM4o,  XMM4p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1039
                      XMM5,  XMM5b,  XMM5c,  XMM5d,  XMM5e,  XMM5f,  XMM5g,  XMM5h,  XMM5i,  XMM5j,  XMM5k,  XMM5l,  XMM5m,  XMM5n,  XMM5o,  XMM5p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1040
                      XMM6,  XMM6b,  XMM6c,  XMM6d,  XMM6e,  XMM6f,  XMM6g,  XMM6h,  XMM6i,  XMM6j,  XMM6k,  XMM6l,  XMM6m,  XMM6n,  XMM6o,  XMM6p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1041
                      XMM7,  XMM7b,  XMM7c,  XMM7d,  XMM7e,  XMM7f,  XMM7g,  XMM7h,  XMM7i,  XMM7j,  XMM7k,  XMM7l,  XMM7m,  XMM7n,  XMM7o,  XMM7p
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1042
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1043
                     ,XMM8,  XMM8b,  XMM8c,  XMM8d,  XMM8e,  XMM8f,  XMM8g,  XMM8h,  XMM8i,  XMM8j,  XMM8k,  XMM8l,  XMM8m,  XMM8n,  XMM8o,  XMM8p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1044
                      XMM9,  XMM9b,  XMM9c,  XMM9d,  XMM9e,  XMM9f,  XMM9g,  XMM9h,  XMM9i,  XMM9j,  XMM9k,  XMM9l,  XMM9m,  XMM9n,  XMM9o,  XMM9p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1045
                      XMM10, XMM10b, XMM10c, XMM10d, XMM10e, XMM10f, XMM10g, XMM10h, XMM10i, XMM10j, XMM10k, XMM10l, XMM10m, XMM10n, XMM10o, XMM10p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1046
                      XMM11, XMM11b, XMM11c, XMM11d, XMM11e, XMM11f, XMM11g, XMM11h, XMM11i, XMM11j, XMM11k, XMM11l, XMM11m, XMM11n, XMM11o, XMM11p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1047
                      XMM12, XMM12b, XMM12c, XMM12d, XMM12e, XMM12f, XMM12g, XMM12h, XMM12i, XMM12j, XMM12k, XMM12l, XMM12m, XMM12n, XMM12o, XMM12p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1048
                      XMM13, XMM13b, XMM13c, XMM13d, XMM13e, XMM13f, XMM13g, XMM13h, XMM13i, XMM13j, XMM13k, XMM13l, XMM13m, XMM13n, XMM13o, XMM13p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1049
                      XMM14, XMM14b, XMM14c, XMM14d, XMM14e, XMM14f, XMM14g, XMM14h, XMM14i, XMM14j, XMM14k, XMM14l, XMM14m, XMM14n, XMM14o, XMM14p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1050
                      XMM15, XMM15b, XMM15c, XMM15d, XMM15e, XMM15f, XMM15g, XMM15h, XMM15i, XMM15j, XMM15k, XMM15l, XMM15m, XMM15n, XMM15o, XMM15p
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1051
                     ,XMM16, XMM16b, XMM16c, XMM16d, XMM16e, XMM16f, XMM16g, XMM16h, XMM16i, XMM16j, XMM16k, XMM16l, XMM16m, XMM16n, XMM16o, XMM16p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1052
                      XMM17, XMM17b, XMM17c, XMM17d, XMM17e, XMM17f, XMM17g, XMM17h, XMM17i, XMM17j, XMM17k, XMM17l, XMM17m, XMM17n, XMM17o, XMM17p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1053
                      XMM18, XMM18b, XMM18c, XMM18d, XMM18e, XMM18f, XMM18g, XMM18h, XMM18i, XMM18j, XMM18k, XMM18l, XMM18m, XMM18n, XMM18o, XMM18p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1054
                      XMM19, XMM19b, XMM19c, XMM19d, XMM19e, XMM19f, XMM19g, XMM19h, XMM19i, XMM19j, XMM19k, XMM19l, XMM19m, XMM19n, XMM19o, XMM19p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1055
                      XMM20, XMM20b, XMM20c, XMM20d, XMM20e, XMM20f, XMM20g, XMM20h, XMM20i, XMM20j, XMM20k, XMM20l, XMM20m, XMM20n, XMM20o, XMM20p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1056
                      XMM21, XMM21b, XMM21c, XMM21d, XMM21e, XMM21f, XMM21g, XMM21h, XMM21i, XMM21j, XMM21k, XMM21l, XMM21m, XMM21n, XMM21o, XMM21p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1057
                      XMM22, XMM22b, XMM22c, XMM22d, XMM22e, XMM22f, XMM22g, XMM22h, XMM22i, XMM22j, XMM22k, XMM22l, XMM22m, XMM22n, XMM22o, XMM22p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1058
                      XMM23, XMM23b, XMM23c, XMM23d, XMM23e, XMM23f, XMM23g, XMM23h, XMM23i, XMM23j, XMM23k, XMM23l, XMM23m, XMM23n, XMM23o, XMM23p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1059
                      XMM24, XMM24b, XMM24c, XMM24d, XMM24e, XMM24f, XMM24g, XMM24h, XMM24i, XMM24j, XMM24k, XMM24l, XMM24m, XMM24n, XMM24o, XMM24p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1060
                      XMM25, XMM25b, XMM25c, XMM25d, XMM25e, XMM25f, XMM25g, XMM25h, XMM25i, XMM25j, XMM25k, XMM25l, XMM25m, XMM25n, XMM25o, XMM25p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1061
                      XMM26, XMM26b, XMM26c, XMM26d, XMM26e, XMM26f, XMM26g, XMM26h, XMM26i, XMM26j, XMM26k, XMM26l, XMM26m, XMM26n, XMM26o, XMM26p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1062
                      XMM27, XMM27b, XMM27c, XMM27d, XMM27e, XMM27f, XMM27g, XMM27h, XMM27i, XMM27j, XMM27k, XMM27l, XMM27m, XMM27n, XMM27o, XMM27p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1063
                      XMM28, XMM28b, XMM28c, XMM28d, XMM28e, XMM28f, XMM28g, XMM28h, XMM28i, XMM28j, XMM28k, XMM28l, XMM28m, XMM28n, XMM28o, XMM28p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1064
                      XMM29, XMM29b, XMM29c, XMM29d, XMM29e, XMM29f, XMM29g, XMM29h, XMM29i, XMM29j, XMM29k, XMM29l, XMM29m, XMM29n, XMM29o, XMM29p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1065
                      XMM30, XMM30b, XMM30c, XMM30d, XMM30e, XMM30f, XMM30g, XMM30h, XMM30i, XMM30j, XMM30k, XMM30l, XMM30m, XMM30n, XMM30o, XMM30p,
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1066
                      XMM31, XMM31b, XMM31c, XMM31d, XMM31e, XMM31f, XMM31g, XMM31h, XMM31i, XMM31j, XMM31k, XMM31l, XMM31m, XMM31n, XMM31o, XMM31p
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1067
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1068
                      );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1069
50525
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1070
reg_class xmm0_reg(XMM0, XMM0b, XMM0c, XMM0d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1071
reg_class ymm0_reg(XMM0, XMM0b, XMM0c, XMM0d, XMM0e, XMM0f, XMM0g, XMM0h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1072
reg_class zmm0_reg(XMM0, XMM0b, XMM0c, XMM0d, XMM0e, XMM0f, XMM0g, XMM0h, XMM0i, XMM0j, XMM0k, XMM0l, XMM0m, XMM0n, XMM0o, XMM0p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1073
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1074
reg_class xmm1_reg(XMM1, XMM1b, XMM1c, XMM1d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1075
reg_class ymm1_reg(XMM1, XMM1b, XMM1c, XMM1d, XMM1e, XMM1f, XMM1g, XMM1h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1076
reg_class zmm1_reg(XMM1, XMM1b, XMM1c, XMM1d, XMM1e, XMM1f, XMM1g, XMM1h, XMM1i, XMM1j, XMM1k, XMM1l, XMM1m, XMM1n, XMM1o, XMM1p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1077
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1078
reg_class xmm2_reg(XMM2, XMM2b, XMM2c, XMM2d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1079
reg_class ymm2_reg(XMM2, XMM2b, XMM2c, XMM2d, XMM2e, XMM2f, XMM2g, XMM2h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1080
reg_class zmm2_reg(XMM2, XMM2b, XMM2c, XMM2d, XMM2e, XMM2f, XMM2g, XMM2h, XMM2i, XMM2j, XMM2k, XMM2l, XMM2m, XMM2n, XMM2o, XMM2p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1081
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1082
reg_class xmm3_reg(XMM3, XMM3b, XMM3c, XMM3d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1083
reg_class ymm3_reg(XMM3, XMM3b, XMM3c, XMM3d, XMM3e, XMM3f, XMM3g, XMM3h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1084
reg_class zmm3_reg(XMM3, XMM3b, XMM3c, XMM3d, XMM3e, XMM3f, XMM3g, XMM3h, XMM3i, XMM3j, XMM3k, XMM3l, XMM3m, XMM3n, XMM3o, XMM3p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1085
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1086
reg_class xmm4_reg(XMM4, XMM4b, XMM4c, XMM4d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1087
reg_class ymm4_reg(XMM4, XMM4b, XMM4c, XMM4d, XMM4e, XMM4f, XMM4g, XMM4h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1088
reg_class zmm4_reg(XMM4, XMM4b, XMM4c, XMM4d, XMM4e, XMM4f, XMM4g, XMM4h, XMM4i, XMM4j, XMM4k, XMM4l, XMM4m, XMM4n, XMM4o, XMM4p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1089
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1090
reg_class xmm5_reg(XMM5, XMM5b, XMM5c, XMM5d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1091
reg_class ymm5_reg(XMM5, XMM5b, XMM5c, XMM5d, XMM5e, XMM5f, XMM5g, XMM5h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1092
reg_class zmm5_reg(XMM5, XMM5b, XMM5c, XMM5d, XMM5e, XMM5f, XMM5g, XMM5h, XMM5i, XMM5j, XMM5k, XMM5l, XMM5m, XMM5n, XMM5o, XMM5p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1093
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1094
reg_class xmm6_reg(XMM6, XMM6b, XMM6c, XMM6d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1095
reg_class ymm6_reg(XMM6, XMM6b, XMM6c, XMM6d, XMM6e, XMM6f, XMM6g, XMM6h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1096
reg_class zmm6_reg(XMM6, XMM6b, XMM6c, XMM6d, XMM6e, XMM6f, XMM6g, XMM6h, XMM6i, XMM6j, XMM6k, XMM6l, XMM6m, XMM6n, XMM6o, XMM6p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1097
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1098
reg_class xmm7_reg(XMM7, XMM7b, XMM7c, XMM7d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1099
reg_class ymm7_reg(XMM7, XMM7b, XMM7c, XMM7d, XMM7e, XMM7f, XMM7g, XMM7h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1100
reg_class zmm7_reg(XMM7, XMM7b, XMM7c, XMM7d, XMM7e, XMM7f, XMM7g, XMM7h, XMM7i, XMM7j, XMM7k, XMM7l, XMM7m, XMM7n, XMM7o, XMM7p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1101
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1102
#ifdef _LP64
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1103
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1104
reg_class xmm8_reg(XMM8, XMM8b, XMM8c, XMM8d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1105
reg_class ymm8_reg(XMM8, XMM8b, XMM8c, XMM8d, XMM8e, XMM8f, XMM8g, XMM8h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1106
reg_class zmm8_reg(XMM8, XMM8b, XMM8c, XMM8d, XMM8e, XMM8f, XMM8g, XMM8h, XMM8i, XMM8j, XMM8k, XMM8l, XMM8m, XMM8n, XMM8o, XMM8p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1107
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1108
reg_class xmm9_reg(XMM9, XMM9b, XMM9c, XMM9d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1109
reg_class ymm9_reg(XMM9, XMM9b, XMM9c, XMM9d, XMM9e, XMM9f, XMM9g, XMM9h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1110
reg_class zmm9_reg(XMM9, XMM9b, XMM9c, XMM9d, XMM9e, XMM9f, XMM9g, XMM9h, XMM9i, XMM9j, XMM9k, XMM9l, XMM9m, XMM9n, XMM9o, XMM9p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1111
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1112
reg_class xmm10_reg(XMM10, XMM10b, XMM10c, XMM10d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1113
reg_class ymm10_reg(XMM10, XMM10b, XMM10c, XMM10d, XMM10e, XMM10f, XMM10g, XMM10h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1114
reg_class zmm10_reg(XMM10, XMM10b, XMM10c, XMM10d, XMM10e, XMM10f, XMM10g, XMM10h, XMM10i, XMM10j, XMM10k, XMM10l, XMM10m, XMM10n, XMM10o, XMM10p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1115
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1116
reg_class xmm11_reg(XMM11, XMM11b, XMM11c, XMM11d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1117
reg_class ymm11_reg(XMM11, XMM11b, XMM11c, XMM11d, XMM11e, XMM11f, XMM11g, XMM11h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1118
reg_class zmm11_reg(XMM11, XMM11b, XMM11c, XMM11d, XMM11e, XMM11f, XMM11g, XMM11h, XMM11i, XMM11j, XMM11k, XMM11l, XMM11m, XMM11n, XMM11o, XMM11p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1119
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1120
reg_class xmm12_reg(XMM12, XMM12b, XMM12c, XMM12d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1121
reg_class ymm12_reg(XMM12, XMM12b, XMM12c, XMM12d, XMM12e, XMM12f, XMM12g, XMM12h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1122
reg_class zmm12_reg(XMM12, XMM12b, XMM12c, XMM12d, XMM12e, XMM12f, XMM12g, XMM12h, XMM12i, XMM12j, XMM12k, XMM12l, XMM12m, XMM12n, XMM12o, XMM12p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1123
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1124
reg_class xmm13_reg(XMM13, XMM13b, XMM13c, XMM13d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1125
reg_class ymm13_reg(XMM13, XMM13b, XMM13c, XMM13d, XMM13e, XMM13f, XMM13g, XMM13h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1126
reg_class zmm13_reg(XMM13, XMM13b, XMM13c, XMM13d, XMM13e, XMM13f, XMM13g, XMM13h, XMM13i, XMM13j, XMM13k, XMM13l, XMM13m, XMM13n, XMM13o, XMM13p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1127
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1128
reg_class xmm14_reg(XMM14, XMM14b, XMM14c, XMM14d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1129
reg_class ymm14_reg(XMM14, XMM14b, XMM14c, XMM14d, XMM14e, XMM14f, XMM14g, XMM14h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1130
reg_class zmm14_reg(XMM14, XMM14b, XMM14c, XMM14d, XMM14e, XMM14f, XMM14g, XMM14h, XMM14i, XMM14j, XMM14k, XMM14l, XMM14m, XMM14n, XMM14o, XMM14p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1131
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1132
reg_class xmm15_reg(XMM15, XMM15b, XMM15c, XMM15d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1133
reg_class ymm15_reg(XMM15, XMM15b, XMM15c, XMM15d, XMM15e, XMM15f, XMM15g, XMM15h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1134
reg_class zmm15_reg(XMM15, XMM15b, XMM15c, XMM15d, XMM15e, XMM15f, XMM15g, XMM15h, XMM15i, XMM15j, XMM15k, XMM15l, XMM15m, XMM15n, XMM15o, XMM15p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1135
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1136
reg_class xmm16_reg(XMM16, XMM16b, XMM16c, XMM16d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1137
reg_class ymm16_reg(XMM16, XMM16b, XMM16c, XMM16d, XMM16e, XMM16f, XMM16g, XMM16h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1138
reg_class zmm16_reg(XMM16, XMM16b, XMM16c, XMM16d, XMM16e, XMM16f, XMM16g, XMM16h, XMM16i, XMM16j, XMM16k, XMM16l, XMM16m, XMM16n, XMM16o, XMM16p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1139
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1140
reg_class xmm17_reg(XMM17, XMM17b, XMM17c, XMM17d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1141
reg_class ymm17_reg(XMM17, XMM17b, XMM17c, XMM17d, XMM17e, XMM17f, XMM17g, XMM17h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1142
reg_class zmm17_reg(XMM17, XMM17b, XMM17c, XMM17d, XMM17e, XMM17f, XMM17g, XMM17h, XMM17i, XMM17j, XMM17k, XMM17l, XMM17m, XMM17n, XMM17o, XMM17p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1143
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1144
reg_class xmm18_reg(XMM18, XMM18b, XMM18c, XMM18d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1145
reg_class ymm18_reg(XMM18, XMM18b, XMM18c, XMM18d, XMM18e, XMM18f, XMM18g, XMM18h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1146
reg_class zmm18_reg(XMM18, XMM18b, XMM18c, XMM18d, XMM18e, XMM18f, XMM18g, XMM18h, XMM18i, XMM18j, XMM18k, XMM18l, XMM18m, XMM18n, XMM18o, XMM18p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1147
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1148
reg_class xmm19_reg(XMM19, XMM19b, XMM19c, XMM19d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1149
reg_class ymm19_reg(XMM19, XMM19b, XMM19c, XMM19d, XMM19e, XMM19f, XMM19g, XMM19h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1150
reg_class zmm19_reg(XMM19, XMM19b, XMM19c, XMM19d, XMM19e, XMM19f, XMM19g, XMM19h, XMM19i, XMM19j, XMM19k, XMM19l, XMM19m, XMM19n, XMM19o, XMM19p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1151
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1152
reg_class xmm20_reg(XMM20, XMM20b, XMM20c, XMM20d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1153
reg_class ymm20_reg(XMM20, XMM20b, XMM20c, XMM20d, XMM20e, XMM20f, XMM20g, XMM20h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1154
reg_class zmm20_reg(XMM20, XMM20b, XMM20c, XMM20d, XMM20e, XMM20f, XMM20g, XMM20h, XMM20i, XMM20j, XMM20k, XMM20l, XMM20m, XMM20n, XMM20o, XMM20p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1155
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1156
reg_class xmm21_reg(XMM21, XMM21b, XMM21c, XMM21d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1157
reg_class ymm21_reg(XMM21, XMM21b, XMM21c, XMM21d, XMM21e, XMM21f, XMM21g, XMM21h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1158
reg_class zmm21_reg(XMM21, XMM21b, XMM21c, XMM21d, XMM21e, XMM21f, XMM21g, XMM21h, XMM21i, XMM21j, XMM21k, XMM21l, XMM21m, XMM21n, XMM21o, XMM21p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1159
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1160
reg_class xmm22_reg(XMM22, XMM22b, XMM22c, XMM22d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1161
reg_class ymm22_reg(XMM22, XMM22b, XMM22c, XMM22d, XMM22e, XMM22f, XMM22g, XMM22h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1162
reg_class zmm22_reg(XMM22, XMM22b, XMM22c, XMM22d, XMM22e, XMM22f, XMM22g, XMM22h, XMM22i, XMM22j, XMM22k, XMM22l, XMM22m, XMM22n, XMM22o, XMM22p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1163
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1164
reg_class xmm23_reg(XMM23, XMM23b, XMM23c, XMM23d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1165
reg_class ymm23_reg(XMM23, XMM23b, XMM23c, XMM23d, XMM23e, XMM23f, XMM23g, XMM23h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1166
reg_class zmm23_reg(XMM23, XMM23b, XMM23c, XMM23d, XMM23e, XMM23f, XMM23g, XMM23h, XMM23i, XMM23j, XMM23k, XMM23l, XMM23m, XMM23n, XMM23o, XMM23p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1167
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1168
reg_class xmm24_reg(XMM24, XMM24b, XMM24c, XMM24d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1169
reg_class ymm24_reg(XMM24, XMM24b, XMM24c, XMM24d, XMM24e, XMM24f, XMM24g, XMM24h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1170
reg_class zmm24_reg(XMM24, XMM24b, XMM24c, XMM24d, XMM24e, XMM24f, XMM24g, XMM24h, XMM24i, XMM24j, XMM24k, XMM24l, XMM24m, XMM24n, XMM24o, XMM24p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1171
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1172
reg_class xmm25_reg(XMM25, XMM25b, XMM25c, XMM25d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1173
reg_class ymm25_reg(XMM25, XMM25b, XMM25c, XMM25d, XMM25e, XMM25f, XMM25g, XMM25h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1174
reg_class zmm25_reg(XMM25, XMM25b, XMM25c, XMM25d, XMM25e, XMM25f, XMM25g, XMM25h, XMM25i, XMM25j, XMM25k, XMM25l, XMM25m, XMM25n, XMM25o, XMM25p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1175
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1176
reg_class xmm26_reg(XMM26, XMM26b, XMM26c, XMM26d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1177
reg_class ymm26_reg(XMM26, XMM26b, XMM26c, XMM26d, XMM26e, XMM26f, XMM26g, XMM26h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1178
reg_class zmm26_reg(XMM26, XMM26b, XMM26c, XMM26d, XMM26e, XMM26f, XMM26g, XMM26h, XMM26i, XMM26j, XMM26k, XMM26l, XMM26m, XMM26n, XMM26o, XMM26p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1179
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1180
reg_class xmm27_reg(XMM27, XMM27b, XMM27c, XMM27d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1181
reg_class ymm27_reg(XMM27, XMM27b, XMM27c, XMM27d, XMM27e, XMM27f, XMM27g, XMM27h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1182
reg_class zmm27_reg(XMM27, XMM27b, XMM27c, XMM27d, XMM27e, XMM27f, XMM27g, XMM27h, XMM27i, XMM27j, XMM27k, XMM27l, XMM27m, XMM27n, XMM27o, XMM27p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1183
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1184
reg_class xmm28_reg(XMM28, XMM28b, XMM28c, XMM28d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1185
reg_class ymm28_reg(XMM28, XMM28b, XMM28c, XMM28d, XMM28e, XMM28f, XMM28g, XMM28h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1186
reg_class zmm28_reg(XMM28, XMM28b, XMM28c, XMM28d, XMM28e, XMM28f, XMM28g, XMM28h, XMM28i, XMM28j, XMM28k, XMM28l, XMM28m, XMM28n, XMM28o, XMM28p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1187
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1188
reg_class xmm29_reg(XMM29, XMM29b, XMM29c, XMM29d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1189
reg_class ymm29_reg(XMM29, XMM29b, XMM29c, XMM29d, XMM29e, XMM29f, XMM29g, XMM29h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1190
reg_class zmm29_reg(XMM29, XMM29b, XMM29c, XMM29d, XMM29e, XMM29f, XMM29g, XMM29h, XMM29i, XMM29j, XMM29k, XMM29l, XMM29m, XMM29n, XMM29o, XMM29p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1191
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1192
reg_class xmm30_reg(XMM30, XMM30b, XMM30c, XMM30d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1193
reg_class ymm30_reg(XMM30, XMM30b, XMM30c, XMM30d, XMM30e, XMM30f, XMM30g, XMM30h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1194
reg_class zmm30_reg(XMM30, XMM30b, XMM30c, XMM30d, XMM30e, XMM30f, XMM30g, XMM30h, XMM30i, XMM30j, XMM30k, XMM30l, XMM30m, XMM30n, XMM30o, XMM30p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1195
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1196
reg_class xmm31_reg(XMM31, XMM31b, XMM31c, XMM31d);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1197
reg_class ymm31_reg(XMM31, XMM31b, XMM31c, XMM31d, XMM31e, XMM31f, XMM31g, XMM31h);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1198
reg_class zmm31_reg(XMM31, XMM31b, XMM31c, XMM31d, XMM31e, XMM31f, XMM31g, XMM31h, XMM31i, XMM31j, XMM31k, XMM31l, XMM31m, XMM31n, XMM31o, XMM31p);
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1199
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1200
#endif
767cdb97f103 8204210: Implementation: JEP 333: ZGC: A Scalable Low-Latency Garbage Collector (Experimental)
pliden
parents: 49384
diff changeset
  1201
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1202
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1203
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1204
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1205
//----------SOURCE BLOCK-------------------------------------------------------
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1206
// This is a block of C++ code which provides values, functions, and
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1207
// definitions necessary in the rest of the architecture description
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1208
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1209
source_hpp %{
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1210
// Header information of the source block.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1211
// Method declarations/definitions which are used outside
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1212
// the ad-scope can conveniently be defined here.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1213
//
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1214
// To keep related declarations/definitions/uses close together,
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1215
// we switch between source %{ }% and source_hpp %{ }% freely as needed.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1216
25715
d5a8dbdc5150 8049325: Introduce and clean up umbrella headers for the files in the cpu subdirectories.
goetz
parents: 23498
diff changeset
  1217
class NativeJump;
d5a8dbdc5150 8049325: Introduce and clean up umbrella headers for the files in the cpu subdirectories.
goetz
parents: 23498
diff changeset
  1218
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1219
class CallStubImpl {
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1220
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1221
  //--------------------------------------------------------------
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1222
  //---<  Used for optimization in Compile::shorten_branches  >---
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1223
  //--------------------------------------------------------------
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1224
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1225
 public:
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1226
  // Size of call trampoline stub.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1227
  static uint size_call_trampoline() {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1228
    return 0; // no call trampolines on this platform
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1229
  }
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1230
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1231
  // number of relocations needed by a call trampoline stub
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1232
  static uint reloc_call_trampoline() {
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1233
    return 0; // no call trampolines on this platform
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1234
  }
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1235
};
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1236
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1237
class HandlerImpl {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1238
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1239
 public:
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1240
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1241
  static int emit_exception_handler(CodeBuffer &cbuf);
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1242
  static int emit_deopt_handler(CodeBuffer& cbuf);
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1243
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1244
  static uint size_exception_handler() {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1245
    // NativeCall instruction size is the same as NativeJump.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1246
    // exception handler starts out as jump and can be patched to
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1247
    // a call be deoptimization.  (4932387)
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1248
    // Note that this value is also credited (in output.cpp) to
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1249
    // the size of the code section.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1250
    return NativeJump::instruction_size;
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1251
  }
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1252
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1253
#ifdef _LP64
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1254
  static uint size_deopt_handler() {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1255
    // three 5 byte instructions
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1256
    return 15;
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1257
  }
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1258
#else
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1259
  static uint size_deopt_handler() {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1260
    // NativeCall instruction size is the same as NativeJump.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1261
    // exception handler starts out as jump and can be patched to
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1262
    // a call be deoptimization.  (4932387)
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1263
    // Note that this value is also credited (in output.cpp) to
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1264
    // the size of the code section.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1265
    return 5 + NativeJump::instruction_size; // pushl(); jmp;
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1266
  }
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1267
#endif
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1268
};
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1269
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1270
%} // end source_hpp
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1271
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1272
source %{
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1273
38286
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1274
#include "opto/addnode.hpp"
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1275
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1276
// Emit exception handler code.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1277
// Stuff framesize into a register and call a VM stub routine.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1278
int HandlerImpl::emit_exception_handler(CodeBuffer& cbuf) {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1279
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1280
  // Note that the code buffer's insts_mark is always relative to insts.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1281
  // That's why we must use the macroassembler to generate a handler.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1282
  MacroAssembler _masm(&cbuf);
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1283
  address base = __ start_a_stub(size_exception_handler());
32082
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1284
  if (base == NULL) {
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1285
    ciEnv::current()->record_failure("CodeCache is full");
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1286
    return 0;  // CodeBuffer::expand failed
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1287
  }
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1288
  int offset = __ offset();
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1289
  __ jump(RuntimeAddress(OptoRuntime::exception_blob()->entry_point()));
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1290
  assert(__ offset() - offset <= (int) size_exception_handler(), "overflow");
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1291
  __ end_a_stub();
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1292
  return offset;
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1293
}
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1294
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1295
// Emit deopt handler code.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1296
int HandlerImpl::emit_deopt_handler(CodeBuffer& cbuf) {
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1297
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1298
  // Note that the code buffer's insts_mark is always relative to insts.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1299
  // That's why we must use the macroassembler to generate a handler.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1300
  MacroAssembler _masm(&cbuf);
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1301
  address base = __ start_a_stub(size_deopt_handler());
32082
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1302
  if (base == NULL) {
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1303
    ciEnv::current()->record_failure("CodeCache is full");
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1304
    return 0;  // CodeBuffer::expand failed
2a3323e25de1 8130309: Need to bailout cleanly if creation of stubs fails when codecache is out of space
thartmann
parents: 31410
diff changeset
  1305
  }
23498
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1306
  int offset = __ offset();
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1307
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1308
#ifdef _LP64
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1309
  address the_pc = (address) __ pc();
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1310
  Label next;
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1311
  // push a "the_pc" on the stack without destroying any registers
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1312
  // as they all may be live.
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1313
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1314
  // push address of "next"
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1315
  __ call(next, relocInfo::none); // reloc none is fine since it is a disp32
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1316
  __ bind(next);
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1317
  // adjust it so it matches "the_pc"
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1318
  __ subptr(Address(rsp, 0), __ offset() - offset);
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1319
#else
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1320
  InternalAddress here(__ pc());
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1321
  __ pushptr(here.addr());
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1322
#endif
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1323
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1324
  __ jump(RuntimeAddress(SharedRuntime::deopt_blob()->unpack()));
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1325
  assert(__ offset() - offset <= (int) size_deopt_handler(), "overflow");
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1326
  __ end_a_stub();
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1327
  return offset;
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1328
}
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1329
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1330
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1331
//=============================================================================
a0e67b766e5c 8037821: Account for trampoline stubs when estimating code buffer sizes
goetz
parents: 22505
diff changeset
  1332
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1333
  // Float masks come from different places depending on platform.
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1334
#ifdef _LP64
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1335
  static address float_signmask()  { return StubRoutines::x86::float_sign_mask(); }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1336
  static address float_signflip()  { return StubRoutines::x86::float_sign_flip(); }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1337
  static address double_signmask() { return StubRoutines::x86::double_sign_mask(); }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1338
  static address double_signflip() { return StubRoutines::x86::double_sign_flip(); }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1339
#else
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1340
  static address float_signmask()  { return (address)float_signmask_pool; }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1341
  static address float_signflip()  { return (address)float_signflip_pool; }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1342
  static address double_signmask() { return (address)double_signmask_pool; }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1343
  static address double_signflip() { return (address)double_signflip_pool; }
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1344
#endif
11794
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1345
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1346
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1347
const bool Matcher::match_rule_supported(int opcode) {
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1348
  if (!has_match_rule(opcode))
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1349
    return false;
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1350
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1351
  bool ret_value = true;
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1352
  switch (opcode) {
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1353
    case Op_PopCountI:
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1354
    case Op_PopCountL:
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1355
      if (!UsePopCountInstruction)
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1356
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1357
      break;
49384
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  1358
    case Op_PopCountVI:
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  1359
      if (!UsePopCountInstruction || !VM_Version::supports_vpopcntdq())
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  1360
        ret_value = false;
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
  1361
      break;
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1362
    case Op_MulVI:
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1363
      if ((UseSSE < 4) && (UseAVX < 1)) // only with SSE4_1 or AVX
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1364
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1365
      break;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1366
    case Op_MulVL:
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1367
    case Op_MulReductionVL:
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1368
      if (VM_Version::supports_avx512dq() == false)
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1369
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1370
      break;
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1371
    case Op_AddReductionVL:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1372
      if (UseAVX < 3) // only EVEX : vector connectivity becomes an issue here
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1373
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1374
      break;
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1375
    case Op_AddReductionVI:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1376
      if (UseSSE < 3) // requires at least SSE3
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1377
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1378
      break;
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1379
    case Op_MulReductionVI:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1380
      if (UseSSE < 4) // requires at least SSE4
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1381
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1382
      break;
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1383
    case Op_AddReductionVF:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1384
    case Op_AddReductionVD:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1385
    case Op_MulReductionVF:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1386
    case Op_MulReductionVD:
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  1387
      if (UseSSE < 1) // requires at least SSE
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1388
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1389
      break;
32723
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  1390
    case Op_SqrtVD:
48089
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  1391
    case Op_SqrtVF:
32723
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  1392
      if (UseAVX < 1) // enabled for AVX only
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1393
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1394
      break;
13886
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13883
diff changeset
  1395
    case Op_CompareAndSwapL:
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13883
diff changeset
  1396
#ifdef _LP64
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13883
diff changeset
  1397
    case Op_CompareAndSwapP:
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13883
diff changeset
  1398
#endif
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13883
diff changeset
  1399
      if (!VM_Version::supports_cx8())
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1400
        ret_value = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1401
      break;
48309
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  1402
    case Op_CMoveVF:
33469
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1403
    case Op_CMoveVD:
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1404
      if (UseAVX < 1 || UseAVX > 2)
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1405
        ret_value = false;
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1406
      break;
35581
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1407
    case Op_StrIndexOf:
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1408
      if (!UseSSE42Intrinsics)
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1409
        ret_value = false;
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1410
      break;
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1411
    case Op_StrIndexOfChar:
39253
bd5fe208734e 8157842: indexOfChar intrinsic is not emitted on x86
thartmann
parents: 38286
diff changeset
  1412
      if (!UseSSE42Intrinsics)
35581
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1413
        ret_value = false;
dd47cf4734f2 8145336: PPC64: fix string intrinsics after CompactStrings change
simonis
parents: 34162
diff changeset
  1414
      break;
38017
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  1415
    case Op_OnSpinWait:
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  1416
      if (VM_Version::supports_on_spin_wait() == false)
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  1417
        ret_value = false;
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  1418
      break;
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1419
  }
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1420
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1421
  return ret_value;  // Per default match rules are supported.
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1422
}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  1423
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1424
const bool Matcher::match_rule_supported_vector(int opcode, int vlen) {
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1425
  // identify extra cases that we might want to provide match rules for
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1426
  // e.g. Op_ vector nodes and other intrinsics while guarding with vlen
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1427
  bool ret_value = match_rule_supported(opcode);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1428
  if (ret_value) {
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1429
    switch (opcode) {
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1430
      case Op_AddVB:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1431
      case Op_SubVB:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1432
        if ((vlen == 64) && (VM_Version::supports_avx512bw() == false))
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1433
          ret_value = false;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1434
        break;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1435
      case Op_URShiftVS:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1436
      case Op_RShiftVS:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1437
      case Op_LShiftVS:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1438
      case Op_MulVS:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1439
      case Op_AddVS:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1440
      case Op_SubVS:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1441
        if ((vlen == 32) && (VM_Version::supports_avx512bw() == false))
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1442
          ret_value = false;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1443
        break;
48309
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  1444
      case Op_CMoveVF:
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  1445
        if (vlen != 8)
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  1446
          ret_value  = false;
51078
fc6cfe40e32a 8207049: Minor improvements of compiler code.
goetz
parents: 50525
diff changeset
  1447
        break;
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1448
      case Op_CMoveVD:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1449
        if (vlen != 4)
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1450
          ret_value  = false;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1451
        break;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1452
    }
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1453
  }
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1454
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1455
  return ret_value;  // Per default match rules are supported.
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1456
}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1457
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1458
const bool Matcher::has_predicated_vectors(void) {
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1459
  bool ret_value = false;
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1460
  if (UseAVX > 2) {
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1461
    ret_value = VM_Version::supports_avx512vl();
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1462
  }
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1463
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1464
  return ret_value;
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1465
}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1466
33065
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1467
const int Matcher::float_pressure(int default_pressure_threshold) {
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1468
  int float_pressure_threshold = default_pressure_threshold;
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1469
#ifdef _LP64
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1470
  if (UseAVX > 2) {
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1471
    // Increase pressure threshold on machines with AVX3 which have
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1472
    // 2x more XMM registers.
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1473
    float_pressure_threshold = default_pressure_threshold * 2;
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1474
  }
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1475
#endif
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1476
  return float_pressure_threshold;
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1477
}
55892792936f 8134802: LCM register pressure scheduling
mcberg
parents: 32727
diff changeset
  1478
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1479
// Max vector size in bytes. 0 if not supported.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1480
const int Matcher::vector_width_in_bytes(BasicType bt) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1481
  assert(is_java_primitive(bt), "only primitive type vectors");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1482
  if (UseSSE < 2) return 0;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1483
  // SSE2 supports 128bit vectors for all types.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1484
  // AVX2 supports 256bit vectors for all types.
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1485
  // AVX2/EVEX supports 512bit vectors for all types.
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1486
  int size = (UseAVX > 1) ? (1 << UseAVX) * 8 : 16;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1487
  // AVX1 supports 256bit vectors only for FLOAT and DOUBLE.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1488
  if (UseAVX > 0 && (bt == T_FLOAT || bt == T_DOUBLE))
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1489
    size = (UseAVX > 2) ? 64 : 32;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1490
  // Use flag to limit vector size.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1491
  size = MIN2(size,(int)MaxVectorSize);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1492
  // Minimum 2 values in vector (or 4 for bytes).
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1493
  switch (bt) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1494
  case T_DOUBLE:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1495
  case T_LONG:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1496
    if (size < 16) return 0;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1497
    break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1498
  case T_FLOAT:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1499
  case T_INT:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1500
    if (size < 8) return 0;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1501
    break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1502
  case T_BOOLEAN:
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1503
    if (size < 4) return 0;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1504
    break;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1505
  case T_CHAR:
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1506
    if (size < 4) return 0;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1507
    break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1508
  case T_BYTE:
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1509
    if (size < 4) return 0;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1510
    break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1511
  case T_SHORT:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1512
    if (size < 4) return 0;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1513
    break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1514
  default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1515
    ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1516
  }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1517
  return size;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1518
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1519
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1520
// Limits on vector size (number of elements) loaded into vector.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1521
const int Matcher::max_vector_size(const BasicType bt) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1522
  return vector_width_in_bytes(bt)/type2aelembytes(bt);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1523
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1524
const int Matcher::min_vector_size(const BasicType bt) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1525
  int max_size = max_vector_size(bt);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1526
  // Min size which can be loaded into vector is 4 bytes.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1527
  int size = (type2aelembytes(bt) == 1) ? 4 : 2;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1528
  return MIN2(size,max_size);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1529
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1530
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1531
// Vector ideal reg corresponding to specidied size in bytes
46378
4ccca1fdf627 8160748: Inconsistent types for ideal_reg
kbarrett
parents: 42039
diff changeset
  1532
const uint Matcher::vector_ideal_reg(int size) {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1533
  assert(MaxVectorSize >= size, "");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1534
  switch(size) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1535
    case  4: return Op_VecS;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1536
    case  8: return Op_VecD;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1537
    case 16: return Op_VecX;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1538
    case 32: return Op_VecY;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1539
    case 64: return Op_VecZ;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1540
  }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1541
  ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1542
  return 0;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1543
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1544
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  1545
// Only lowest bits of xmm reg are used for vector shift count.
46378
4ccca1fdf627 8160748: Inconsistent types for ideal_reg
kbarrett
parents: 42039
diff changeset
  1546
const uint Matcher::vector_shift_count_ideal_reg(int size) {
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  1547
  return Op_VecS;
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  1548
}
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  1549
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1550
// x86 supports misaligned vectors store/load.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1551
const bool Matcher::misaligned_vectors_ok() {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1552
  return !AlignVector; // can be changed by flag
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1553
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1554
22505
4523090c9674 8002074: Support for AES on SPARC
kvn
parents: 14131
diff changeset
  1555
// x86 AES instructions are compatible with SunJCE expanded
4523090c9674 8002074: Support for AES on SPARC
kvn
parents: 14131
diff changeset
  1556
// keys, hence we do not need to pass the original key to stubs
4523090c9674 8002074: Support for AES on SPARC
kvn
parents: 14131
diff changeset
  1557
const bool Matcher::pass_original_key_for_aes() {
4523090c9674 8002074: Support for AES on SPARC
kvn
parents: 14131
diff changeset
  1558
  return false;
4523090c9674 8002074: Support for AES on SPARC
kvn
parents: 14131
diff changeset
  1559
}
4523090c9674 8002074: Support for AES on SPARC
kvn
parents: 14131
diff changeset
  1560
38286
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1561
38236
510f77046e00 8154943: AArch64: redundant address computation instructions with vectorization
roland
parents: 38049
diff changeset
  1562
const bool Matcher::convi2l_type_required = true;
510f77046e00 8154943: AArch64: redundant address computation instructions with vectorization
roland
parents: 38049
diff changeset
  1563
38286
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1564
// Check for shift by small constant as well
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1565
static bool clone_shift(Node* shift, Matcher* matcher, Matcher::MStack& mstack, VectorSet& address_visited) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1566
  if (shift->Opcode() == Op_LShiftX && shift->in(2)->is_Con() &&
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1567
      shift->in(2)->get_int() <= 3 &&
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1568
      // Are there other uses besides address expressions?
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1569
      !matcher->is_visited(shift)) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1570
    address_visited.set(shift->_idx); // Flag as address_visited
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1571
    mstack.push(shift->in(2), Matcher::Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1572
    Node *conv = shift->in(1);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1573
#ifdef _LP64
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1574
    // Allow Matcher to match the rule which bypass
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1575
    // ConvI2L operation for an array index on LP64
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1576
    // if the index value is positive.
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1577
    if (conv->Opcode() == Op_ConvI2L &&
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1578
        conv->as_Type()->type()->is_long()->_lo >= 0 &&
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1579
        // Are there other uses besides address expressions?
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1580
        !matcher->is_visited(conv)) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1581
      address_visited.set(conv->_idx); // Flag as address_visited
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1582
      mstack.push(conv->in(1), Matcher::Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1583
    } else
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1584
#endif
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1585
      mstack.push(conv, Matcher::Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1586
    return true;
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1587
  }
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1588
  return false;
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1589
}
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1590
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1591
// Should the Matcher clone shifts on addressing modes, expecting them
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1592
// to be subsumed into complex addressing expressions or compute them
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1593
// into registers?
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1594
bool Matcher::clone_address_expressions(AddPNode* m, Matcher::MStack& mstack, VectorSet& address_visited) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1595
  Node *off = m->in(AddPNode::Offset);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1596
  if (off->is_Con()) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1597
    address_visited.test_set(m->_idx); // Flag as address_visited
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1598
    Node *adr = m->in(AddPNode::Address);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1599
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1600
    // Intel can handle 2 adds in addressing mode
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1601
    // AtomicAdd is not an addressing expression.
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1602
    // Cheap to find it by looking for screwy base.
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1603
    if (adr->is_AddP() &&
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1604
        !adr->in(AddPNode::Base)->is_top() &&
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1605
        // Are there other uses besides address expressions?
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1606
        !is_visited(adr)) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1607
      address_visited.set(adr->_idx); // Flag as address_visited
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1608
      Node *shift = adr->in(AddPNode::Offset);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1609
      if (!clone_shift(shift, this, mstack, address_visited)) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1610
        mstack.push(shift, Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1611
      }
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1612
      mstack.push(adr->in(AddPNode::Address), Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1613
      mstack.push(adr->in(AddPNode::Base), Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1614
    } else {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1615
      mstack.push(adr, Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1616
    }
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1617
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1618
    // Clone X+offset as it also folds into most addressing expressions
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1619
    mstack.push(off, Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1620
    mstack.push(m->in(AddPNode::Base), Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1621
    return true;
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1622
  } else if (clone_shift(off, this, mstack, address_visited)) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1623
    address_visited.test_set(m->_idx); // Flag as address_visited
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1624
    mstack.push(m->in(AddPNode::Address), Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1625
    mstack.push(m->in(AddPNode::Base), Pre_Visit);
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1626
    return true;
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1627
  }
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1628
  return false;
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1629
}
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1630
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1631
void Compile::reshape_address(AddPNode* addp) {
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1632
}
0ddb6f84e138 8154826: AArch64: take advantage better of base + shifted offset addressing mode
roland
parents: 38236
diff changeset
  1633
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1634
// Helper methods for MachSpillCopyNode::implementation().
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1635
static int vec_mov_helper(CodeBuffer *cbuf, bool do_size, int src_lo, int dst_lo,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1636
                          int src_hi, int dst_hi, uint ireg, outputStream* st) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1637
  // In 64-bit VM size calculation is very complex. Emitting instructions
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1638
  // into scratch buffer is used to get size in 64-bit VM.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1639
  LP64_ONLY( assert(!do_size, "this method calculates size only for 32-bit VM"); )
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1640
  assert(ireg == Op_VecS || // 32bit vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1641
         (src_lo & 1) == 0 && (src_lo + 1) == src_hi &&
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1642
         (dst_lo & 1) == 0 && (dst_lo + 1) == dst_hi,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1643
         "no non-adjacent vector moves" );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1644
  if (cbuf) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1645
    MacroAssembler _masm(cbuf);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1646
    int offset = __ offset();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1647
    switch (ireg) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1648
    case Op_VecS: // copy whole register
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1649
    case Op_VecD:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1650
    case Op_VecX:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1651
      __ movdqu(as_XMMRegister(Matcher::_regEncode[dst_lo]), as_XMMRegister(Matcher::_regEncode[src_lo]));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1652
      break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1653
    case Op_VecY:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1654
      __ vmovdqu(as_XMMRegister(Matcher::_regEncode[dst_lo]), as_XMMRegister(Matcher::_regEncode[src_lo]));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1655
      break;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1656
    case Op_VecZ:
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1657
      __ evmovdquq(as_XMMRegister(Matcher::_regEncode[dst_lo]), as_XMMRegister(Matcher::_regEncode[src_lo]), 2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1658
      break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1659
    default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1660
      ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1661
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1662
    int size = __ offset() - offset;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1663
#ifdef ASSERT
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1664
    // VEX_2bytes prefix is used if UseAVX > 0, so it takes the same 2 bytes as SIMD prefix.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1665
    assert(!do_size || size == 4, "incorrect size calculattion");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1666
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1667
    return size;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1668
#ifndef PRODUCT
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1669
  } else if (!do_size) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1670
    switch (ireg) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1671
    case Op_VecS:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1672
    case Op_VecD:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1673
    case Op_VecX:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1674
      st->print("movdqu  %s,%s\t# spill",Matcher::regName[dst_lo],Matcher::regName[src_lo]);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1675
      break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1676
    case Op_VecY:
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1677
    case Op_VecZ:
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1678
      st->print("vmovdqu %s,%s\t# spill",Matcher::regName[dst_lo],Matcher::regName[src_lo]);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1679
      break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1680
    default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1681
      ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1682
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1683
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1684
  }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1685
  // VEX_2bytes prefix is used if UseAVX > 0, and it takes the same 2 bytes as SIMD prefix.
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1686
  return (UseAVX > 2) ? 6 : 4;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1687
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1688
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1689
static int vec_spill_helper(CodeBuffer *cbuf, bool do_size, bool is_load,
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1690
                            int stack_offset, int reg, uint ireg, outputStream* st) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1691
  // In 64-bit VM size calculation is very complex. Emitting instructions
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1692
  // into scratch buffer is used to get size in 64-bit VM.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1693
  LP64_ONLY( assert(!do_size, "this method calculates size only for 32-bit VM"); )
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1694
  if (cbuf) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1695
    MacroAssembler _masm(cbuf);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1696
    int offset = __ offset();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1697
    if (is_load) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1698
      switch (ireg) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1699
      case Op_VecS:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1700
        __ movdl(as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1701
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1702
      case Op_VecD:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1703
        __ movq(as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1704
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1705
      case Op_VecX:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1706
        __ movdqu(as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1707
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1708
      case Op_VecY:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1709
        __ vmovdqu(as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1710
        break;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1711
      case Op_VecZ:
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1712
        __ evmovdquq(as_XMMRegister(Matcher::_regEncode[reg]), Address(rsp, stack_offset), 2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1713
        break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1714
      default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1715
        ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1716
      }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1717
    } else { // store
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1718
      switch (ireg) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1719
      case Op_VecS:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1720
        __ movdl(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1721
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1722
      case Op_VecD:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1723
        __ movq(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1724
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1725
      case Op_VecX:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1726
        __ movdqu(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1727
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1728
      case Op_VecY:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1729
        __ vmovdqu(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1730
        break;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1731
      case Op_VecZ:
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1732
        __ evmovdquq(Address(rsp, stack_offset), as_XMMRegister(Matcher::_regEncode[reg]), 2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1733
        break;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1734
      default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1735
        ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1736
      }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1737
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1738
    int size = __ offset() - offset;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1739
#ifdef ASSERT
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1740
    int offset_size = (stack_offset == 0) ? 0 : ((stack_offset < 0x80) ? 1 : (UseAVX > 2) ? 6 : 4);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1741
    // VEX_2bytes prefix is used if UseAVX > 0, so it takes the same 2 bytes as SIMD prefix.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1742
    assert(!do_size || size == (5+offset_size), "incorrect size calculattion");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1743
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1744
    return size;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1745
#ifndef PRODUCT
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1746
  } else if (!do_size) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1747
    if (is_load) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1748
      switch (ireg) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1749
      case Op_VecS:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1750
        st->print("movd    %s,[rsp + %d]\t# spill", Matcher::regName[reg], stack_offset);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1751
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1752
      case Op_VecD:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1753
        st->print("movq    %s,[rsp + %d]\t# spill", Matcher::regName[reg], stack_offset);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1754
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1755
       case Op_VecX:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1756
        st->print("movdqu  %s,[rsp + %d]\t# spill", Matcher::regName[reg], stack_offset);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1757
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1758
      case Op_VecY:
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1759
      case Op_VecZ:
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1760
        st->print("vmovdqu %s,[rsp + %d]\t# spill", Matcher::regName[reg], stack_offset);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1761
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1762
      default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1763
        ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1764
      }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1765
    } else { // store
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1766
      switch (ireg) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1767
      case Op_VecS:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1768
        st->print("movd    [rsp + %d],%s\t# spill", stack_offset, Matcher::regName[reg]);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1769
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1770
      case Op_VecD:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1771
        st->print("movq    [rsp + %d],%s\t# spill", stack_offset, Matcher::regName[reg]);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1772
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1773
       case Op_VecX:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1774
        st->print("movdqu  [rsp + %d],%s\t# spill", stack_offset, Matcher::regName[reg]);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1775
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1776
      case Op_VecY:
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1777
      case Op_VecZ:
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1778
        st->print("vmovdqu [rsp + %d],%s\t# spill", stack_offset, Matcher::regName[reg]);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1779
        break;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1780
      default:
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1781
        ShouldNotReachHere();
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1782
      }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1783
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1784
#endif
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1785
  }
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1786
  bool is_single_byte = false;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1787
  int vec_len = 0;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1788
  if ((UseAVX > 2) && (stack_offset != 0)) {
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1789
    int tuple_type = Assembler::EVEX_FVM;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1790
    int input_size = Assembler::EVEX_32bit;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1791
    switch (ireg) {
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1792
    case Op_VecS:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1793
      tuple_type = Assembler::EVEX_T1S;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1794
      break;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1795
    case Op_VecD:
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1796
      tuple_type = Assembler::EVEX_T1S;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1797
      input_size = Assembler::EVEX_64bit;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1798
      break;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1799
    case Op_VecX:
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1800
      break;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1801
    case Op_VecY:
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1802
      vec_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1803
      break;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1804
    case Op_VecZ:
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1805
      vec_len = 2;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1806
      break;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1807
    }
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1808
    is_single_byte = Assembler::query_compressed_disp_byte(stack_offset, true, vec_len, tuple_type, input_size, 0);
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1809
  }
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1810
  int offset_size = 0;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1811
  int size = 5;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1812
  if (UseAVX > 2 ) {
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1813
    if (VM_Version::supports_avx512novl() && (vec_len == 2)) {
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1814
      offset_size = (stack_offset == 0) ? 0 : ((is_single_byte) ? 1 : 4);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1815
      size += 2; // Need an additional two bytes for EVEX encoding
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  1816
    } else if (VM_Version::supports_avx512novl() && (vec_len < 2)) {
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1817
      offset_size = (stack_offset == 0) ? 0 : ((stack_offset <= 127) ? 1 : 4);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1818
    } else {
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1819
      offset_size = (stack_offset == 0) ? 0 : ((is_single_byte) ? 1 : 4);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1820
      size += 2; // Need an additional two bytes for EVEX encodding
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1821
    }
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1822
  } else {
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1823
    offset_size = (stack_offset == 0) ? 0 : ((stack_offset <= 127) ? 1 : 4);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1824
  }
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1825
  // VEX_2bytes prefix is used if UseAVX > 0, so it takes the same 2 bytes as SIMD prefix.
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  1826
  return size+offset_size;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1827
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1828
40040
7644f470d923 8160425: Vectorization with signalling NaN returns wrong result
thartmann
parents: 39253
diff changeset
  1829
static inline jint replicate4_imm(int con, int width) {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1830
  // Load a constant of "width" (in bytes) and replicate it to fill 32bit.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1831
  assert(width == 1 || width == 2, "only byte or short types here");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1832
  int bit_width = width * 8;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1833
  jint val = con;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1834
  val &= (1 << bit_width) - 1;  // mask off sign bits
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1835
  while(bit_width < 32) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1836
    val |= (val << bit_width);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1837
    bit_width <<= 1;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1838
  }
40040
7644f470d923 8160425: Vectorization with signalling NaN returns wrong result
thartmann
parents: 39253
diff changeset
  1839
  return val;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1840
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1841
40040
7644f470d923 8160425: Vectorization with signalling NaN returns wrong result
thartmann
parents: 39253
diff changeset
  1842
static inline jlong replicate8_imm(int con, int width) {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1843
  // Load a constant of "width" (in bytes) and replicate it to fill 64bit.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1844
  assert(width == 1 || width == 2 || width == 4, "only byte, short or int types here");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1845
  int bit_width = width * 8;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1846
  jlong val = con;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1847
  val &= (((jlong) 1) << bit_width) - 1;  // mask off sign bits
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1848
  while(bit_width < 64) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1849
    val |= (val << bit_width);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1850
    bit_width <<= 1;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1851
  }
40040
7644f470d923 8160425: Vectorization with signalling NaN returns wrong result
thartmann
parents: 39253
diff changeset
  1852
  return val;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1853
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1854
11794
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1855
#ifndef PRODUCT
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1856
  void MachNopNode::format(PhaseRegAlloc*, outputStream* st) const {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1857
    st->print("nop \t# %d bytes pad for loops and calls", _count);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1858
  }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1859
#endif
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1860
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1861
  void MachNopNode::emit(CodeBuffer &cbuf, PhaseRegAlloc*) const {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1862
    MacroAssembler _masm(&cbuf);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1863
    __ nop(_count);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1864
  }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1865
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1866
  uint MachNopNode::size(PhaseRegAlloc*) const {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1867
    return _count;
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1868
  }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1869
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1870
#ifndef PRODUCT
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1871
  void MachBreakpointNode::format(PhaseRegAlloc*, outputStream* st) const {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1872
    st->print("# breakpoint");
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1873
  }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1874
#endif
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1875
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1876
  void MachBreakpointNode::emit(CodeBuffer &cbuf, PhaseRegAlloc* ra_) const {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1877
    MacroAssembler _masm(&cbuf);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1878
    __ int3();
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1879
  }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1880
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1881
  uint MachBreakpointNode::size(PhaseRegAlloc* ra_) const {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1882
    return MachNode::size(ra_);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1883
  }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1884
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1885
%}
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1886
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1887
encode %{
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1888
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1889
  enc_class call_epilog %{
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1890
    if (VerifyStackAtCalls) {
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1891
      // Check that stack depth is unchanged: find majik cookie on stack
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1892
      int framesize = ra_->reg2offset_unchecked(OptoReg::add(ra_->_matcher._old_SP, -3*VMRegImpl::slots_per_word));
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1893
      MacroAssembler _masm(&cbuf);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1894
      Label L;
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1895
      __ cmpptr(Address(rsp, framesize), (int32_t)0xbadb100d);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1896
      __ jccb(Assembler::equal, L);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1897
      // Die if stack mismatch
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1898
      __ int3();
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1899
      __ bind(L);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1900
    }
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1901
  %}
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1902
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1903
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1904
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1905
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1906
//----------OPERANDS-----------------------------------------------------------
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1907
// Operand definitions must precede instruction definitions for correct parsing
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1908
// in the ADLC because operands constitute user defined types which are used in
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1909
// instruction definitions.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1910
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1911
// This one generically applies only for evex, so only one version
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1912
operand vecZ() %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1913
  constraint(ALLOC_IN_RC(vectorz_reg));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  1914
  match(VecZ);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1915
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1916
  format %{ %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1917
  interface(REG_INTER);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1918
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  1919
33469
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1920
// Comparison Code for FP conditional move
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1921
operand cmpOp_vcmppd() %{
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1922
  match(Bool);
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1923
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1924
  predicate(n->as_Bool()->_test._test != BoolTest::overflow &&
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1925
            n->as_Bool()->_test._test != BoolTest::no_overflow);
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1926
  format %{ "" %}
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1927
  interface(COND_INTER) %{
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1928
    equal        (0x0, "eq");
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1929
    less         (0x1, "lt");
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1930
    less_equal   (0x2, "le");
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1931
    not_equal    (0xC, "ne");
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1932
    greater_equal(0xD, "ge");
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1933
    greater      (0xE, "gt");
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1934
    //TODO cannot compile (adlc breaks) without two next lines with error:
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1935
    // x86_64.ad(13987) Syntax Error: :In operand cmpOp_vcmppd: Do not support this encode constant: ' %{
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1936
    // equal' for overflow.
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1937
    overflow     (0x20, "o");  // not really supported by the instruction
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1938
    no_overflow  (0x21, "no"); // not really supported by the instruction
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1939
  %}
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1940
%}
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1941
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  1942
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1943
// INSTRUCTIONS -- Platform independent definitions (same for 32- and 64-bit)
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1944
11794
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1945
// ============================================================================
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1946
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1947
instruct ShouldNotReachHere() %{
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1948
  match(Halt);
46525
3a5c833a43de 8176506: C2: loop unswitching and unsafe accesses cause crash
roland
parents: 46378
diff changeset
  1949
  format %{ "ud2\t# ShouldNotReachHere" %}
3a5c833a43de 8176506: C2: loop unswitching and unsafe accesses cause crash
roland
parents: 46378
diff changeset
  1950
  ins_encode %{
3a5c833a43de 8176506: C2: loop unswitching and unsafe accesses cause crash
roland
parents: 46378
diff changeset
  1951
    __ ud2();
11794
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1952
  %}
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1953
  ins_pipe(pipe_slow);
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1954
%}
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1955
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1956
// =================================EVEX special===============================
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1957
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1958
instruct setMask(rRegI dst, rRegI src) %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1959
  predicate(Matcher::has_predicated_vectors());
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1960
  match(Set dst (SetVectMaskI  src));
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1961
  effect(TEMP dst);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1962
  format %{ "setvectmask   $dst, $src" %}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1963
  ins_encode %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1964
    __ setvectmask($dst$$Register, $src$$Register);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1965
  %}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1966
  ins_pipe(pipe_slow);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1967
%}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  1968
11794
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1969
// ============================================================================
72249bf6ab83 7145346: VerifyStackAtCalls is broken
kvn
parents: 11429
diff changeset
  1970
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1971
instruct addF_reg(regF dst, regF src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1972
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1973
  match(Set dst (AddF dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1974
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1975
  format %{ "addss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1976
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1977
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1978
    __ addss($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1979
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1980
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1981
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1982
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1983
instruct addF_mem(regF dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1984
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1985
  match(Set dst (AddF dst (LoadF src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1986
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1987
  format %{ "addss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1988
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1989
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1990
    __ addss($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1991
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1992
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1993
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1994
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1995
instruct addF_imm(regF dst, immF con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1996
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1997
  match(Set dst (AddF dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1998
  format %{ "addss   $dst, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  1999
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2000
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2001
    __ addss($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2002
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2003
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2004
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2005
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2006
instruct addF_reg_reg(regF dst, regF src1, regF src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2007
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2008
  match(Set dst (AddF src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2009
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2010
  format %{ "vaddss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2011
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2012
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2013
    __ vaddss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2014
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2015
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2016
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2017
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2018
instruct addF_reg_mem(regF dst, regF src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2019
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2020
  match(Set dst (AddF src1 (LoadF src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2021
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2022
  format %{ "vaddss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2023
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2024
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2025
    __ vaddss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2026
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2027
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2028
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2029
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2030
instruct addF_reg_imm(regF dst, regF src, immF con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2031
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2032
  match(Set dst (AddF src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2033
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2034
  format %{ "vaddss  $dst, $src, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2035
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2036
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2037
    __ vaddss($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2038
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2039
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2040
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2041
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2042
instruct addD_reg(regD dst, regD src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2043
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2044
  match(Set dst (AddD dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2045
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2046
  format %{ "addsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2047
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2048
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2049
    __ addsd($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2050
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2051
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2052
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2053
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2054
instruct addD_mem(regD dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2055
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2056
  match(Set dst (AddD dst (LoadD src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2057
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2058
  format %{ "addsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2059
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2060
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2061
    __ addsd($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2062
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2063
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2064
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2065
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2066
instruct addD_imm(regD dst, immD con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2067
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2068
  match(Set dst (AddD dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2069
  format %{ "addsd   $dst, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2070
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2071
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2072
    __ addsd($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2073
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2074
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2075
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2076
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2077
instruct addD_reg_reg(regD dst, regD src1, regD src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2078
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2079
  match(Set dst (AddD src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2080
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2081
  format %{ "vaddsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2082
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2083
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2084
    __ vaddsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2085
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2086
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2087
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2088
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2089
instruct addD_reg_mem(regD dst, regD src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2090
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2091
  match(Set dst (AddD src1 (LoadD src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2092
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2093
  format %{ "vaddsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2094
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2095
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2096
    __ vaddsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2097
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2098
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2099
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2100
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2101
instruct addD_reg_imm(regD dst, regD src, immD con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2102
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2103
  match(Set dst (AddD src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2104
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2105
  format %{ "vaddsd  $dst, $src, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2106
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2107
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2108
    __ vaddsd($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2109
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2110
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2111
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2112
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2113
instruct subF_reg(regF dst, regF src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2114
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2115
  match(Set dst (SubF dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2116
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2117
  format %{ "subss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2118
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2119
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2120
    __ subss($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2121
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2122
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2123
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2124
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2125
instruct subF_mem(regF dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2126
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2127
  match(Set dst (SubF dst (LoadF src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2128
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2129
  format %{ "subss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2130
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2131
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2132
    __ subss($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2133
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2134
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2135
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2136
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2137
instruct subF_imm(regF dst, immF con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2138
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2139
  match(Set dst (SubF dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2140
  format %{ "subss   $dst, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2141
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2142
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2143
    __ subss($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2144
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2145
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2146
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2147
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2148
instruct subF_reg_reg(regF dst, regF src1, regF src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2149
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2150
  match(Set dst (SubF src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2151
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2152
  format %{ "vsubss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2153
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2154
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2155
    __ vsubss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2156
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2157
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2158
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2159
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2160
instruct subF_reg_mem(regF dst, regF src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2161
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2162
  match(Set dst (SubF src1 (LoadF src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2163
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2164
  format %{ "vsubss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2165
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2166
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2167
    __ vsubss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2168
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2169
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2170
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2171
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2172
instruct subF_reg_imm(regF dst, regF src, immF con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2173
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2174
  match(Set dst (SubF src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2175
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2176
  format %{ "vsubss  $dst, $src, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2177
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2178
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2179
    __ vsubss($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2180
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2181
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2182
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2183
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2184
instruct subD_reg(regD dst, regD src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2185
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2186
  match(Set dst (SubD dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2187
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2188
  format %{ "subsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2189
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2190
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2191
    __ subsd($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2192
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2193
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2194
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2195
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2196
instruct subD_mem(regD dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2197
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2198
  match(Set dst (SubD dst (LoadD src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2199
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2200
  format %{ "subsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2201
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2202
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2203
    __ subsd($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2204
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2205
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2206
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2207
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2208
instruct subD_imm(regD dst, immD con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2209
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2210
  match(Set dst (SubD dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2211
  format %{ "subsd   $dst, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2212
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2213
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2214
    __ subsd($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2215
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2216
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2217
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2218
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2219
instruct subD_reg_reg(regD dst, regD src1, regD src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2220
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2221
  match(Set dst (SubD src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2222
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2223
  format %{ "vsubsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2224
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2225
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2226
    __ vsubsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2227
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2228
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2229
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2230
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2231
instruct subD_reg_mem(regD dst, regD src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2232
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2233
  match(Set dst (SubD src1 (LoadD src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2234
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2235
  format %{ "vsubsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2236
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2237
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2238
    __ vsubsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2239
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2240
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2241
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2242
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2243
instruct subD_reg_imm(regD dst, regD src, immD con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2244
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2245
  match(Set dst (SubD src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2246
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2247
  format %{ "vsubsd  $dst, $src, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2248
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2249
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2250
    __ vsubsd($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2251
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2252
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2253
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2254
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2255
instruct mulF_reg(regF dst, regF src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2256
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2257
  match(Set dst (MulF dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2258
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2259
  format %{ "mulss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2260
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2261
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2262
    __ mulss($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2263
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2264
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2265
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2266
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2267
instruct mulF_mem(regF dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2268
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2269
  match(Set dst (MulF dst (LoadF src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2270
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2271
  format %{ "mulss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2272
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2273
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2274
    __ mulss($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2275
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2276
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2277
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2278
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2279
instruct mulF_imm(regF dst, immF con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2280
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2281
  match(Set dst (MulF dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2282
  format %{ "mulss   $dst, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2283
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2284
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2285
    __ mulss($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2286
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2287
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2288
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2289
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2290
instruct mulF_reg_reg(regF dst, regF src1, regF src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2291
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2292
  match(Set dst (MulF src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2293
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2294
  format %{ "vmulss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2295
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2296
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2297
    __ vmulss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2298
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2299
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2300
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2301
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2302
instruct mulF_reg_mem(regF dst, regF src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2303
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2304
  match(Set dst (MulF src1 (LoadF src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2305
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2306
  format %{ "vmulss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2307
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2308
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2309
    __ vmulss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2310
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2311
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2312
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2313
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2314
instruct mulF_reg_imm(regF dst, regF src, immF con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2315
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2316
  match(Set dst (MulF src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2317
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2318
  format %{ "vmulss  $dst, $src, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2319
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2320
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2321
    __ vmulss($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2322
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2323
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2324
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2325
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2326
instruct mulD_reg(regD dst, regD src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2327
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2328
  match(Set dst (MulD dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2329
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2330
  format %{ "mulsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2331
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2332
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2333
    __ mulsd($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2334
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2335
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2336
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2337
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2338
instruct mulD_mem(regD dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2339
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2340
  match(Set dst (MulD dst (LoadD src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2341
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2342
  format %{ "mulsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2343
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2344
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2345
    __ mulsd($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2346
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2347
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2348
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2349
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2350
instruct mulD_imm(regD dst, immD con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2351
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2352
  match(Set dst (MulD dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2353
  format %{ "mulsd   $dst, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2354
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2355
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2356
    __ mulsd($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2357
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2358
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2359
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2360
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2361
instruct mulD_reg_reg(regD dst, regD src1, regD src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2362
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2363
  match(Set dst (MulD src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2364
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2365
  format %{ "vmulsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2366
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2367
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2368
    __ vmulsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2369
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2370
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2371
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2372
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2373
instruct mulD_reg_mem(regD dst, regD src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2374
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2375
  match(Set dst (MulD src1 (LoadD src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2376
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2377
  format %{ "vmulsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2378
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2379
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2380
    __ vmulsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2381
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2382
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2383
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2384
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2385
instruct mulD_reg_imm(regD dst, regD src, immD con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2386
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2387
  match(Set dst (MulD src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2388
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2389
  format %{ "vmulsd  $dst, $src, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2390
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2391
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2392
    __ vmulsd($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2393
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2394
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2395
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2396
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2397
instruct divF_reg(regF dst, regF src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2398
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2399
  match(Set dst (DivF dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2400
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2401
  format %{ "divss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2402
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2403
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2404
    __ divss($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2405
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2406
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2407
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2408
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2409
instruct divF_mem(regF dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2410
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2411
  match(Set dst (DivF dst (LoadF src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2412
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2413
  format %{ "divss   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2414
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2415
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2416
    __ divss($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2417
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2418
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2419
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2420
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2421
instruct divF_imm(regF dst, immF con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2422
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2423
  match(Set dst (DivF dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2424
  format %{ "divss   $dst, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2425
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2426
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2427
    __ divss($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2428
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2429
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2430
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2431
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2432
instruct divF_reg_reg(regF dst, regF src1, regF src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2433
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2434
  match(Set dst (DivF src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2435
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2436
  format %{ "vdivss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2437
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2438
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2439
    __ vdivss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2440
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2441
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2442
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2443
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2444
instruct divF_reg_mem(regF dst, regF src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2445
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2446
  match(Set dst (DivF src1 (LoadF src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2447
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2448
  format %{ "vdivss  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2449
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2450
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2451
    __ vdivss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2452
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2453
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2454
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2455
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2456
instruct divF_reg_imm(regF dst, regF src, immF con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2457
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2458
  match(Set dst (DivF src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2459
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2460
  format %{ "vdivss  $dst, $src, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2461
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2462
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2463
    __ vdivss($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2464
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2465
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2466
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2467
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2468
instruct divD_reg(regD dst, regD src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2469
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2470
  match(Set dst (DivD dst src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2471
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2472
  format %{ "divsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2473
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2474
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2475
    __ divsd($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2476
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2477
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2478
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2479
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2480
instruct divD_mem(regD dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2481
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2482
  match(Set dst (DivD dst (LoadD src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2483
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2484
  format %{ "divsd   $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2485
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2486
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2487
    __ divsd($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2488
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2489
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2490
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2491
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2492
instruct divD_imm(regD dst, immD con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2493
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2494
  match(Set dst (DivD dst con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2495
  format %{ "divsd   $dst, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2496
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2497
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2498
    __ divsd($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2499
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2500
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2501
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2502
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2503
instruct divD_reg_reg(regD dst, regD src1, regD src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2504
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2505
  match(Set dst (DivD src1 src2));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2506
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2507
  format %{ "vdivsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2508
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2509
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2510
    __ vdivsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2511
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2512
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2513
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2514
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2515
instruct divD_reg_mem(regD dst, regD src1, memory src2) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2516
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2517
  match(Set dst (DivD src1 (LoadD src2)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2518
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2519
  format %{ "vdivsd  $dst, $src1, $src2" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2520
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2521
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2522
    __ vdivsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2523
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2524
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2525
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2526
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2527
instruct divD_reg_imm(regD dst, regD src, immD con) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2528
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2529
  match(Set dst (DivD src con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2530
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2531
  format %{ "vdivsd  $dst, $src, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2532
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2533
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2534
    __ vdivsd($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2535
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2536
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2537
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2538
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2539
instruct absF_reg(regF dst) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2540
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2541
  match(Set dst (AbsF dst));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2542
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2543
  format %{ "andps   $dst, [0x7fffffff]\t# abs float by sign masking" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2544
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2545
    __ andps($dst$$XMMRegister, ExternalAddress(float_signmask()));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2546
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2547
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2548
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2549
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2550
instruct absF_reg_reg(regF dst, regF src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2551
  predicate(VM_Version::supports_avxonly());
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2552
  match(Set dst (AbsF src));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2553
  ins_cost(150);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2554
  format %{ "vandps  $dst, $src, [0x7fffffff]\t# abs float by sign masking" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2555
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2556
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2557
    __ vandps($dst$$XMMRegister, $src$$XMMRegister,
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2558
              ExternalAddress(float_signmask()), vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2559
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2560
  ins_pipe(pipe_slow);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2561
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2562
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2563
#ifdef _LP64
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2564
instruct absF_reg_reg_evex(regF dst, regF src) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2565
  predicate(UseAVX > 2 && VM_Version::supports_avx512vl());
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2566
  match(Set dst (AbsF src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2567
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2568
  format %{ "vandps  $dst, $src, [0x7fffffff]\t# abs float by sign masking" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2569
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2570
    int vector_len = 0;
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2571
    __ vandps($dst$$XMMRegister, $src$$XMMRegister,
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2572
              ExternalAddress(float_signmask()), vector_len);
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2573
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2574
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2575
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2576
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2577
instruct absF_reg_reg_evex_special(regF dst, regF src1, regF src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2578
  predicate(VM_Version::supports_avx512novl());
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2579
  match(Set dst (AbsF src1));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2580
  effect(TEMP src2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2581
  ins_cost(150);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2582
  format %{ "vabsss  $dst, $src1, $src2, [0x7fffffff]\t# abs float by sign masking" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2583
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2584
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2585
    __ vabsss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister,
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2586
              ExternalAddress(float_signmask()), vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2587
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2588
  ins_pipe(pipe_slow);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2589
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2590
#else // _LP64
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2591
instruct absF_reg_reg_evex(regF dst, regF src) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2592
  predicate(UseAVX > 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2593
  match(Set dst (AbsF src));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2594
  ins_cost(150);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2595
  format %{ "vandps  $dst, $src, [0x7fffffff]\t# abs float by sign masking" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2596
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2597
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2598
    __ vandps($dst$$XMMRegister, $src$$XMMRegister,
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2599
              ExternalAddress(float_signmask()), vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2600
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2601
  ins_pipe(pipe_slow);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2602
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2603
#endif
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2604
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2605
instruct absD_reg(regD dst) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2606
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2607
  match(Set dst (AbsD dst));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2608
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2609
  format %{ "andpd   $dst, [0x7fffffffffffffff]\t"
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2610
            "# abs double by sign masking" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2611
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2612
    __ andpd($dst$$XMMRegister, ExternalAddress(double_signmask()));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2613
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2614
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2615
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2616
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2617
instruct absD_reg_reg(regD dst, regD src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2618
  predicate(VM_Version::supports_avxonly());
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2619
  match(Set dst (AbsD src));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2620
  ins_cost(150);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2621
  format %{ "vandpd  $dst, $src, [0x7fffffffffffffff]\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2622
            "# abs double by sign masking" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2623
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2624
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2625
    __ vandpd($dst$$XMMRegister, $src$$XMMRegister,
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2626
              ExternalAddress(double_signmask()), vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2627
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2628
  ins_pipe(pipe_slow);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2629
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2630
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2631
#ifdef _LP64
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2632
instruct absD_reg_reg_evex(regD dst, regD src) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2633
  predicate(UseAVX > 2 && VM_Version::supports_avx512vl());
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2634
  match(Set dst (AbsD src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2635
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2636
  format %{ "vandpd  $dst, $src, [0x7fffffffffffffff]\t"
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2637
            "# abs double by sign masking" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2638
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2639
    int vector_len = 0;
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2640
    __ vandpd($dst$$XMMRegister, $src$$XMMRegister,
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2641
              ExternalAddress(double_signmask()), vector_len);
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2642
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2643
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2644
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2645
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2646
instruct absD_reg_reg_evex_special(regD dst, regD src1, regD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2647
  predicate(VM_Version::supports_avx512novl());
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2648
  match(Set dst (AbsD src1));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2649
  effect(TEMP src2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2650
  ins_cost(150);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2651
  format %{ "vabssd  $dst, $src1, $src2, [0x7fffffffffffffff]\t# abs float by sign masking" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2652
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2653
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2654
    __ vabssd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister,
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2655
              ExternalAddress(double_signmask()), vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2656
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2657
  ins_pipe(pipe_slow);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2658
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2659
#else // _LP64
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2660
instruct absD_reg_reg_evex(regD dst, regD src) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2661
  predicate(UseAVX > 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2662
  match(Set dst (AbsD src));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2663
  ins_cost(150);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2664
  format %{ "vandpd  $dst, $src, [0x7fffffffffffffff]\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2665
            "# abs double by sign masking" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2666
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2667
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2668
    __ vandpd($dst$$XMMRegister, $src$$XMMRegister,
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2669
              ExternalAddress(double_signmask()), vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2670
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2671
  ins_pipe(pipe_slow);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2672
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2673
#endif
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  2674
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2675
instruct negF_reg(regF dst) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2676
  predicate((UseSSE>=1) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2677
  match(Set dst (NegF dst));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2678
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2679
  format %{ "xorps   $dst, [0x80000000]\t# neg float by sign flipping" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2680
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2681
    __ xorps($dst$$XMMRegister, ExternalAddress(float_signflip()));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2682
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2683
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2684
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2685
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2686
instruct negF_reg_reg(regF dst, regF src) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2687
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2688
  match(Set dst (NegF src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2689
  ins_cost(150);
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2690
  format %{ "vnegatess  $dst, $src, [0x80000000]\t# neg float by sign flipping" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2691
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2692
    __ vnegatess($dst$$XMMRegister, $src$$XMMRegister,
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2693
                 ExternalAddress(float_signflip()));
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2694
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2695
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2696
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2697
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2698
instruct negD_reg(regD dst) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2699
  predicate((UseSSE>=2) && (UseAVX == 0));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2700
  match(Set dst (NegD dst));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2701
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2702
  format %{ "xorpd   $dst, [0x8000000000000000]\t"
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2703
            "# neg double by sign flipping" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2704
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2705
    __ xorpd($dst$$XMMRegister, ExternalAddress(double_signflip()));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2706
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2707
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2708
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2709
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  2710
instruct negD_reg_reg(regD dst, regD src) %{
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2711
  predicate(UseAVX > 0);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2712
  match(Set dst (NegD src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2713
  ins_cost(150);
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2714
  format %{ "vnegatess  $dst, $src, [0x8000000000000000]\t"
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2715
            "# neg double by sign flipping" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2716
  ins_encode %{
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2717
    __ vnegatesd($dst$$XMMRegister, $src$$XMMRegister,
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2718
                 ExternalAddress(double_signflip()));
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2719
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2720
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2721
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2722
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2723
instruct sqrtF_reg(regF dst, regF src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2724
  predicate(UseSSE>=1);
48089
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  2725
  match(Set dst (SqrtF src));
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2726
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2727
  format %{ "sqrtss  $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2728
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2729
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2730
    __ sqrtss($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2731
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2732
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2733
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2734
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2735
instruct sqrtF_mem(regF dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2736
  predicate(UseSSE>=1);
48089
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  2737
  match(Set dst (SqrtF (LoadF src)));
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2738
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2739
  format %{ "sqrtss  $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2740
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2741
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2742
    __ sqrtss($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2743
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2744
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2745
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2746
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2747
instruct sqrtF_imm(regF dst, immF con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2748
  predicate(UseSSE>=1);
48089
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  2749
  match(Set dst (SqrtF con));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  2750
11429
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2751
  format %{ "sqrtss  $dst, [$constantaddress]\t# load from constant table: float=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2752
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2753
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2754
    __ sqrtss($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2755
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2756
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2757
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2758
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2759
instruct sqrtD_reg(regD dst, regD src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2760
  predicate(UseSSE>=2);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2761
  match(Set dst (SqrtD src));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2762
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2763
  format %{ "sqrtsd  $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2764
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2765
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2766
    __ sqrtsd($dst$$XMMRegister, $src$$XMMRegister);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2767
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2768
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2769
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2770
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2771
instruct sqrtD_mem(regD dst, memory src) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2772
  predicate(UseSSE>=2);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2773
  match(Set dst (SqrtD (LoadD src)));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2774
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2775
  format %{ "sqrtsd  $dst, $src" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2776
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2777
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2778
    __ sqrtsd($dst$$XMMRegister, $src$$Address);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2779
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2780
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2781
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2782
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2783
instruct sqrtD_imm(regD dst, immD con) %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2784
  predicate(UseSSE>=2);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2785
  match(Set dst (SqrtD con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2786
  format %{ "sqrtsd  $dst, [$constantaddress]\t# load from constant table: double=$con" %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2787
  ins_cost(150);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2788
  ins_encode %{
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2789
    __ sqrtsd($dst$$XMMRegister, $constantaddress($con));
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2790
  %}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2791
  ins_pipe(pipe_slow);
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2792
%}
e894217a5d94 7121648: Use 3-operands SIMD instructions on x86 with AVX
kvn
parents:
diff changeset
  2793
38017
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2794
instruct onspinwait() %{
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2795
  match(OnSpinWait);
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2796
  ins_cost(200);
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2797
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2798
  format %{
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2799
    $$template
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2800
    if (os::is_MP()) {
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2801
      $$emit$$"pause\t! membar_onspinwait"
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2802
    } else {
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2803
      $$emit$$"MEMBAR-onspinwait ! (empty encoding)"
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2804
    }
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2805
  %}
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2806
  ins_encode %{
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2807
    __ pause();
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2808
  %}
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2809
  ins_pipe(pipe_slow);
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2810
%}
55047d16f141 8147844: new method j.l.Runtime.onSpinWait() and the corresponding x86 hotspot instrinsic
ikrylov
parents: 36561
diff changeset
  2811
41323
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2812
// a * b + c
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2813
instruct fmaD_reg(regD a, regD b, regD c) %{
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2814
  predicate(UseFMA);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2815
  match(Set c (FmaD  c (Binary a b)));
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2816
  format %{ "fmasd $a,$b,$c\t# $c = $a * $b + $c" %}
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2817
  ins_cost(150);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2818
  ins_encode %{
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2819
    __ fmad($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2820
  %}
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2821
  ins_pipe( pipe_slow );
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2822
%}
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2823
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2824
// a * b + c
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2825
instruct fmaF_reg(regF a, regF b, regF c) %{
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2826
  predicate(UseFMA);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2827
  match(Set c (FmaF  c (Binary a b)));
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2828
  format %{ "fmass $a,$b,$c\t# $c = $a * $b + $c" %}
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2829
  ins_cost(150);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2830
  ins_encode %{
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2831
    __ fmaf($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2832
  %}
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2833
  ins_pipe( pipe_slow );
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2834
%}
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 40040
diff changeset
  2835
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2836
// ====================VECTOR INSTRUCTIONS=====================================
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2837
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2838
// Load vectors (4 bytes long)
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2839
instruct loadV4(vecS dst, memory mem) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2840
  predicate(n->as_LoadVector()->memory_size() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2841
  match(Set dst (LoadVector mem));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2842
  ins_cost(125);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2843
  format %{ "movd    $dst,$mem\t! load vector (4 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2844
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2845
    __ movdl($dst$$XMMRegister, $mem$$Address);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2846
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2847
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2848
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2849
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2850
// Load vectors (8 bytes long)
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2851
instruct loadV8(vecD dst, memory mem) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2852
  predicate(n->as_LoadVector()->memory_size() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2853
  match(Set dst (LoadVector mem));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2854
  ins_cost(125);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2855
  format %{ "movq    $dst,$mem\t! load vector (8 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2856
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2857
    __ movq($dst$$XMMRegister, $mem$$Address);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2858
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2859
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2860
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2861
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2862
// Load vectors (16 bytes long)
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2863
instruct loadV16(vecX dst, memory mem) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2864
  predicate(n->as_LoadVector()->memory_size() == 16);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2865
  match(Set dst (LoadVector mem));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2866
  ins_cost(125);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2867
  format %{ "movdqu  $dst,$mem\t! load vector (16 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2868
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2869
    __ movdqu($dst$$XMMRegister, $mem$$Address);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2870
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2871
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2872
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2873
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2874
// Load vectors (32 bytes long)
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2875
instruct loadV32(vecY dst, memory mem) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2876
  predicate(n->as_LoadVector()->memory_size() == 32);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2877
  match(Set dst (LoadVector mem));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2878
  ins_cost(125);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2879
  format %{ "vmovdqu $dst,$mem\t! load vector (32 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2880
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2881
    __ vmovdqu($dst$$XMMRegister, $mem$$Address);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2882
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2883
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2884
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2885
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2886
// Load vectors (64 bytes long)
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2887
instruct loadV64_dword(vecZ dst, memory mem) %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2888
  predicate(n->as_LoadVector()->memory_size() == 64 && n->as_LoadVector()->element_size() <= 4);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2889
  match(Set dst (LoadVector mem));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2890
  ins_cost(125);
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2891
  format %{ "vmovdqul $dst k0,$mem\t! load vector (64 bytes)" %}
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2892
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2893
    int vector_len = 2;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2894
    __ evmovdqul($dst$$XMMRegister, $mem$$Address, vector_len);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2895
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2896
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2897
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2898
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2899
// Load vectors (64 bytes long)
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2900
instruct loadV64_qword(vecZ dst, memory mem) %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2901
  predicate(n->as_LoadVector()->memory_size() == 64 && n->as_LoadVector()->element_size() > 4);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2902
  match(Set dst (LoadVector mem));
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2903
  ins_cost(125);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2904
  format %{ "vmovdquq $dst k0,$mem\t! load vector (64 bytes)" %}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2905
  ins_encode %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2906
    int vector_len = 2;
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2907
    __ evmovdquq($dst$$XMMRegister, $mem$$Address, vector_len);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2908
  %}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2909
  ins_pipe( pipe_slow );
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2910
%}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2911
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2912
// Store vectors
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2913
instruct storeV4(memory mem, vecS src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2914
  predicate(n->as_StoreVector()->memory_size() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2915
  match(Set mem (StoreVector mem src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2916
  ins_cost(145);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2917
  format %{ "movd    $mem,$src\t! store vector (4 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2918
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2919
    __ movdl($mem$$Address, $src$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2920
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2921
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2922
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2923
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2924
instruct storeV8(memory mem, vecD src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2925
  predicate(n->as_StoreVector()->memory_size() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2926
  match(Set mem (StoreVector mem src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2927
  ins_cost(145);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2928
  format %{ "movq    $mem,$src\t! store vector (8 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2929
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2930
    __ movq($mem$$Address, $src$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2931
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2932
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2933
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2934
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2935
instruct storeV16(memory mem, vecX src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2936
  predicate(n->as_StoreVector()->memory_size() == 16);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2937
  match(Set mem (StoreVector mem src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2938
  ins_cost(145);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2939
  format %{ "movdqu  $mem,$src\t! store vector (16 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2940
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2941
    __ movdqu($mem$$Address, $src$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2942
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2943
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2944
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2945
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2946
instruct storeV32(memory mem, vecY src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2947
  predicate(n->as_StoreVector()->memory_size() == 32);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2948
  match(Set mem (StoreVector mem src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2949
  ins_cost(145);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2950
  format %{ "vmovdqu $mem,$src\t! store vector (32 bytes)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2951
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2952
    __ vmovdqu($mem$$Address, $src$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2953
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2954
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2955
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  2956
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2957
instruct storeV64_dword(memory mem, vecZ src) %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2958
  predicate(n->as_StoreVector()->memory_size() == 64 && n->as_StoreVector()->element_size() <= 4);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2959
  match(Set mem (StoreVector mem src));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2960
  ins_cost(145);
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2961
  format %{ "vmovdqul $mem k0,$src\t! store vector (64 bytes)" %}
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2962
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2963
    int vector_len = 2;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  2964
    __ evmovdqul($mem$$Address, $src$$XMMRegister, vector_len);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2965
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2966
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2967
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  2968
38049
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2969
instruct storeV64_qword(memory mem, vecZ src) %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2970
  predicate(n->as_StoreVector()->memory_size() == 64 && n->as_StoreVector()->element_size() > 4);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2971
  match(Set mem (StoreVector mem src));
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2972
  ins_cost(145);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2973
  format %{ "vmovdquq $mem k0,$src\t! store vector (64 bytes)" %}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2974
  ins_encode %{
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2975
    int vector_len = 2;
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2976
    __ evmovdquq($mem$$Address, $src$$XMMRegister, vector_len);
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2977
  %}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2978
  ins_pipe( pipe_slow );
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2979
%}
e8541793960f 8153998: Masked vector post loops
mcberg
parents: 38017
diff changeset
  2980
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2981
// ====================LEGACY REPLICATE=======================================
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2982
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2983
instruct Repl4B_mem(vecS dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2984
  predicate(n->as_Vector()->length() == 4 && UseAVX > 0 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2985
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2986
  format %{ "punpcklbw $dst,$mem\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2987
            "pshuflw $dst,$dst,0x00\t! replicate4B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2988
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2989
    __ punpcklbw($dst$$XMMRegister, $mem$$Address);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2990
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2991
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2992
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2993
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2994
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2995
instruct Repl8B_mem(vecD dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2996
  predicate(n->as_Vector()->length() == 8 && UseAVX > 0 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2997
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2998
  format %{ "punpcklbw $dst,$mem\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  2999
            "pshuflw $dst,$dst,0x00\t! replicate8B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3000
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3001
    __ punpcklbw($dst$$XMMRegister, $mem$$Address);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3002
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3003
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3004
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3005
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3006
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3007
instruct Repl16B(vecX dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3008
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3009
  match(Set dst (ReplicateB src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3010
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3011
            "punpcklbw $dst,$dst\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3012
            "pshuflw $dst,$dst,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3013
            "punpcklqdq $dst,$dst\t! replicate16B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3014
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3015
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3016
    __ punpcklbw($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3017
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3018
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3019
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3020
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3021
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3022
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3023
instruct Repl16B_mem(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3024
  predicate(n->as_Vector()->length() == 16 && UseAVX > 0 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3025
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3026
  format %{ "punpcklbw $dst,$mem\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3027
            "pshuflw $dst,$dst,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3028
            "punpcklqdq $dst,$dst\t! replicate16B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3029
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3030
    __ punpcklbw($dst$$XMMRegister, $mem$$Address);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3031
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3032
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3033
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3034
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3035
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3036
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3037
instruct Repl32B(vecY dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3038
  predicate(n->as_Vector()->length() == 32 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3039
  match(Set dst (ReplicateB src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3040
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3041
            "punpcklbw $dst,$dst\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3042
            "pshuflw $dst,$dst,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3043
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3044
            "vinserti128_high $dst,$dst\t! replicate32B" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3045
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3046
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3047
    __ punpcklbw($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3048
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3049
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3050
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3051
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3052
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3053
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3054
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3055
instruct Repl32B_mem(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3056
  predicate(n->as_Vector()->length() == 32 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3057
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3058
  format %{ "punpcklbw $dst,$mem\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3059
            "pshuflw $dst,$dst,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3060
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3061
            "vinserti128_high $dst,$dst\t! replicate32B" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3062
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3063
    __ punpcklbw($dst$$XMMRegister, $mem$$Address);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3064
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3065
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3066
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3067
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3068
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3069
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3070
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3071
instruct Repl16B_imm(vecX dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3072
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3073
  match(Set dst (ReplicateB con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3074
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3075
            "punpcklqdq $dst,$dst\t! replicate16B($con)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3076
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3077
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3078
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3079
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3080
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3081
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3082
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3083
instruct Repl32B_imm(vecY dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3084
  predicate(n->as_Vector()->length() == 32 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3085
  match(Set dst (ReplicateB con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3086
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3087
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3088
            "vinserti128_high $dst,$dst\t! lreplicate32B($con)" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3089
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3090
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3091
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3092
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3093
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3094
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3095
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3096
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3097
instruct Repl4S(vecD dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3098
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3099
  match(Set dst (ReplicateS src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3100
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3101
            "pshuflw $dst,$dst,0x00\t! replicate4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3102
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3103
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3104
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3105
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3106
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3107
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3108
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3109
instruct Repl4S_mem(vecD dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3110
  predicate(n->as_Vector()->length() == 4 && UseAVX > 0 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3111
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3112
  format %{ "pshuflw $dst,$mem,0x00\t! replicate4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3113
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3114
    __ pshuflw($dst$$XMMRegister, $mem$$Address, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3115
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3116
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3117
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3118
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3119
instruct Repl8S(vecX dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3120
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3121
  match(Set dst (ReplicateS src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3122
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3123
            "pshuflw $dst,$dst,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3124
            "punpcklqdq $dst,$dst\t! replicate8S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3125
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3126
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3127
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3128
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3129
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3130
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3131
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3132
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3133
instruct Repl8S_mem(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3134
  predicate(n->as_Vector()->length() == 8 && UseAVX > 0 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3135
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3136
  format %{ "pshuflw $dst,$mem,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3137
            "punpcklqdq $dst,$dst\t! replicate8S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3138
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3139
    __ pshuflw($dst$$XMMRegister, $mem$$Address, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3140
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3141
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3142
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3143
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3144
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3145
instruct Repl8S_imm(vecX dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3146
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3147
  match(Set dst (ReplicateS con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3148
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3149
            "punpcklqdq $dst,$dst\t! replicate8S($con)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3150
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3151
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3152
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3153
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3154
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3155
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3156
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3157
instruct Repl16S(vecY dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3158
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3159
  match(Set dst (ReplicateS src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3160
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3161
            "pshuflw $dst,$dst,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3162
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3163
            "vinserti128_high $dst,$dst\t! replicate16S" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3164
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3165
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3166
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3167
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3168
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3169
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3170
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3171
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3172
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3173
instruct Repl16S_mem(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3174
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3175
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3176
  format %{ "pshuflw $dst,$mem,0x00\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3177
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3178
            "vinserti128_high $dst,$dst\t! replicate16S" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3179
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3180
    __ pshuflw($dst$$XMMRegister, $mem$$Address, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3181
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3182
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3183
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3184
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3185
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3186
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3187
instruct Repl16S_imm(vecY dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3188
  predicate(n->as_Vector()->length() == 16 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3189
  match(Set dst (ReplicateS con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3190
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3191
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3192
            "vinserti128_high $dst,$dst\t! replicate16S($con)" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3193
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3194
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3195
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3196
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3197
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3198
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3199
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3200
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3201
instruct Repl4I(vecX dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3202
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3203
  match(Set dst (ReplicateI src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3204
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3205
            "pshufd  $dst,$dst,0x00\t! replicate4I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3206
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3207
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3208
    __ pshufd($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3209
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3210
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3211
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3212
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3213
instruct Repl4I_mem(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3214
  predicate(n->as_Vector()->length() == 4 && UseAVX > 0 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3215
  match(Set dst (ReplicateI (LoadI mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3216
  format %{ "pshufd  $dst,$mem,0x00\t! replicate4I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3217
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3218
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3219
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3220
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3221
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3222
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3223
instruct Repl8I(vecY dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3224
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3225
  match(Set dst (ReplicateI src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3226
  format %{ "movd    $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3227
            "pshufd  $dst,$dst,0x00\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3228
            "vinserti128_high $dst,$dst\t! replicate8I" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3229
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3230
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3231
    __ pshufd($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3232
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3233
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3234
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3235
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3236
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3237
instruct Repl8I_mem(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3238
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3239
  match(Set dst (ReplicateI (LoadI mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3240
  format %{ "pshufd  $dst,$mem,0x00\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3241
            "vinserti128_high $dst,$dst\t! replicate8I" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3242
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3243
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x00);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3244
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3245
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3246
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3247
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3248
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3249
instruct Repl4I_imm(vecX dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3250
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3251
  match(Set dst (ReplicateI con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3252
  format %{ "movq    $dst,[$constantaddress]\t! replicate4I($con)\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3253
            "punpcklqdq $dst,$dst" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3254
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3255
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3256
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3257
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3258
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3259
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3260
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3261
instruct Repl8I_imm(vecY dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3262
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3263
  match(Set dst (ReplicateI con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3264
  format %{ "movq    $dst,[$constantaddress]\t! replicate8I($con)\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3265
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3266
            "vinserti128_high $dst,$dst" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3267
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3268
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3269
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3270
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3271
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3272
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3273
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3274
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3275
// Long could be loaded into xmm register directly from memory.
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3276
instruct Repl2L_mem(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3277
  predicate(n->as_Vector()->length() == 2 && !VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3278
  match(Set dst (ReplicateL (LoadL mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3279
  format %{ "movq    $dst,$mem\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3280
            "punpcklqdq $dst,$dst\t! replicate2L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3281
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3282
    __ movq($dst$$XMMRegister, $mem$$Address);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3283
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3284
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3285
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3286
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3287
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3288
// Replicate long (8 byte) scalar to be vector
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3289
#ifdef _LP64
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3290
instruct Repl4L(vecY dst, rRegL src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3291
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3292
  match(Set dst (ReplicateL src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3293
  format %{ "movdq   $dst,$src\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3294
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3295
            "vinserti128_high $dst,$dst\t! replicate4L" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3296
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3297
    __ movdq($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3298
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3299
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3300
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3301
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3302
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3303
#else // _LP64
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3304
instruct Repl4L(vecY dst, eRegL src, regD tmp) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3305
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3306
  match(Set dst (ReplicateL src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3307
  effect(TEMP dst, USE src, TEMP tmp);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3308
  format %{ "movdl   $dst,$src.lo\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3309
            "movdl   $tmp,$src.hi\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3310
            "punpckldq $dst,$tmp\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3311
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3312
            "vinserti128_high $dst,$dst\t! replicate4L" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3313
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3314
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3315
    __ movdl($tmp$$XMMRegister, HIGH_FROM_LOW($src$$Register));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3316
    __ punpckldq($dst$$XMMRegister, $tmp$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3317
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3318
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3319
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3320
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3321
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3322
#endif // _LP64
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3323
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3324
instruct Repl4L_imm(vecY dst, immL con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3325
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3326
  match(Set dst (ReplicateL con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3327
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3328
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3329
            "vinserti128_high $dst,$dst\t! replicate4L($con)" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3330
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3331
    __ movq($dst$$XMMRegister, $constantaddress($con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3332
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3333
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3334
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3335
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3336
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3337
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3338
instruct Repl4L_mem(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3339
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3340
  match(Set dst (ReplicateL (LoadL mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3341
  format %{ "movq    $dst,$mem\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3342
            "punpcklqdq $dst,$dst\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3343
            "vinserti128_high $dst,$dst\t! replicate4L" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3344
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3345
    __ movq($dst$$XMMRegister, $mem$$Address);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3346
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3347
    __ vinserti128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3348
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3349
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3350
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3351
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3352
instruct Repl2F_mem(vecD dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3353
  predicate(n->as_Vector()->length() == 2 && UseAVX > 0 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3354
  match(Set dst (ReplicateF (LoadF mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3355
  format %{ "pshufd  $dst,$mem,0x00\t! replicate2F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3356
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3357
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3358
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3359
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3360
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3361
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3362
instruct Repl4F_mem(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3363
  predicate(n->as_Vector()->length() == 4 && UseAVX > 0 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3364
  match(Set dst (ReplicateF (LoadF mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3365
  format %{ "pshufd  $dst,$mem,0x00\t! replicate4F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3366
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3367
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x00);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3368
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3369
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3370
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3371
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3372
instruct Repl8F(vecY dst, regF src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3373
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3374
  match(Set dst (ReplicateF src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3375
  format %{ "pshufd  $dst,$src,0x00\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3376
            "vinsertf128_high $dst,$dst\t! replicate8F" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3377
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3378
    __ pshufd($dst$$XMMRegister, $src$$XMMRegister, 0x00);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3379
    __ vinsertf128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3380
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3381
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3382
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3383
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3384
instruct Repl8F_mem(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3385
  predicate(n->as_Vector()->length() == 8 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3386
  match(Set dst (ReplicateF (LoadF mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3387
  format %{ "pshufd  $dst,$mem,0x00\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3388
            "vinsertf128_high $dst,$dst\t! replicate8F" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3389
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3390
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x00);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3391
    __ vinsertf128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3392
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3393
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3394
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3395
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3396
instruct Repl2F_zero(vecD dst, immF0 zero) %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3397
  predicate(n->as_Vector()->length() == 2 && UseAVX < 3);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3398
  match(Set dst (ReplicateF zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3399
  format %{ "xorps   $dst,$dst\t! replicate2F zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3400
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3401
    __ xorps($dst$$XMMRegister, $dst$$XMMRegister);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3402
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3403
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3404
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3405
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3406
instruct Repl4F_zero(vecX dst, immF0 zero) %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3407
  predicate(n->as_Vector()->length() == 4 && UseAVX < 3);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3408
  match(Set dst (ReplicateF zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3409
  format %{ "xorps   $dst,$dst\t! replicate4F zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3410
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3411
    __ xorps($dst$$XMMRegister, $dst$$XMMRegister);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3412
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3413
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3414
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3415
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3416
instruct Repl8F_zero(vecY dst, immF0 zero) %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3417
  predicate(n->as_Vector()->length() == 8 && UseAVX < 3);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3418
  match(Set dst (ReplicateF zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3419
  format %{ "vxorps  $dst,$dst,$dst\t! replicate8F zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3420
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3421
    int vector_len = 1;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3422
    __ vxorps($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3423
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3424
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3425
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3426
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3427
instruct Repl2D_mem(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3428
  predicate(n->as_Vector()->length() == 2 && UseAVX > 0 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3429
  match(Set dst (ReplicateD (LoadD mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3430
  format %{ "pshufd  $dst,$mem,0x44\t! replicate2D" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3431
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3432
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x44);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3433
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3434
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3435
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3436
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3437
instruct Repl4D(vecY dst, regD src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3438
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3439
  match(Set dst (ReplicateD src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3440
  format %{ "pshufd  $dst,$src,0x44\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3441
            "vinsertf128_high $dst,$dst\t! replicate4D" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3442
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3443
    __ pshufd($dst$$XMMRegister, $src$$XMMRegister, 0x44);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3444
    __ vinsertf128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3445
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3446
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3447
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3448
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3449
instruct Repl4D_mem(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3450
  predicate(n->as_Vector()->length() == 4 && !VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3451
  match(Set dst (ReplicateD (LoadD mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3452
  format %{ "pshufd  $dst,$mem,0x44\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3453
            "vinsertf128_high $dst,$dst\t! replicate4D" %}
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3454
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3455
    __ pshufd($dst$$XMMRegister, $mem$$Address, 0x44);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  3456
    __ vinsertf128_high($dst$$XMMRegister, $dst$$XMMRegister);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3457
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3458
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3459
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3460
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3461
// Replicate double (8 byte) scalar zero to be vector
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3462
instruct Repl2D_zero(vecX dst, immD0 zero) %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3463
  predicate(n->as_Vector()->length() == 2 && UseAVX < 3);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3464
  match(Set dst (ReplicateD zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3465
  format %{ "xorpd   $dst,$dst\t! replicate2D zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3466
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3467
    __ xorpd($dst$$XMMRegister, $dst$$XMMRegister);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3468
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3469
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3470
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3471
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3472
instruct Repl4D_zero(vecY dst, immD0 zero) %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3473
  predicate(n->as_Vector()->length() == 4 && UseAVX < 3);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3474
  match(Set dst (ReplicateD zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3475
  format %{ "vxorpd  $dst,$dst,$dst,vect256\t! replicate4D zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3476
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3477
    int vector_len = 1;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3478
    __ vxorpd($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3479
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3480
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3481
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3482
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3483
// ====================GENERIC REPLICATE==========================================
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3484
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3485
// Replicate byte scalar to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3486
instruct Repl4B(vecS dst, rRegI src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3487
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3488
  match(Set dst (ReplicateB src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3489
  format %{ "movd    $dst,$src\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3490
            "punpcklbw $dst,$dst\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3491
            "pshuflw $dst,$dst,0x00\t! replicate4B" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3492
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3493
    __ movdl($dst$$XMMRegister, $src$$Register);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3494
    __ punpcklbw($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3495
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3496
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3497
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3498
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3499
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3500
instruct Repl8B(vecD dst, rRegI src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3501
  predicate(n->as_Vector()->length() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3502
  match(Set dst (ReplicateB src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3503
  format %{ "movd    $dst,$src\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3504
            "punpcklbw $dst,$dst\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3505
            "pshuflw $dst,$dst,0x00\t! replicate8B" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3506
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3507
    __ movdl($dst$$XMMRegister, $src$$Register);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3508
    __ punpcklbw($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3509
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3510
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3511
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3512
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3513
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3514
// Replicate byte scalar immediate to be vector by loading from const table.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3515
instruct Repl4B_imm(vecS dst, immI con) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3516
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3517
  match(Set dst (ReplicateB con));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3518
  format %{ "movdl   $dst,[$constantaddress]\t! replicate4B($con)" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3519
  ins_encode %{
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3520
    __ movdl($dst$$XMMRegister, $constantaddress(replicate4_imm($con$$constant, 1)));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3521
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3522
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3523
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3524
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3525
instruct Repl8B_imm(vecD dst, immI con) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3526
  predicate(n->as_Vector()->length() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3527
  match(Set dst (ReplicateB con));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3528
  format %{ "movq    $dst,[$constantaddress]\t! replicate8B($con)" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3529
  ins_encode %{
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3530
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3531
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3532
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3533
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3534
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3535
// Replicate byte scalar zero to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3536
instruct Repl4B_zero(vecS dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3537
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3538
  match(Set dst (ReplicateB zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3539
  format %{ "pxor    $dst,$dst\t! replicate4B zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3540
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3541
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3542
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3543
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3544
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3545
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3546
instruct Repl8B_zero(vecD dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3547
  predicate(n->as_Vector()->length() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3548
  match(Set dst (ReplicateB zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3549
  format %{ "pxor    $dst,$dst\t! replicate8B zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3550
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3551
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3552
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3553
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3554
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3555
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3556
instruct Repl16B_zero(vecX dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3557
  predicate(n->as_Vector()->length() == 16);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3558
  match(Set dst (ReplicateB zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3559
  format %{ "pxor    $dst,$dst\t! replicate16B zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3560
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3561
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3562
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3563
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3564
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3565
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3566
instruct Repl32B_zero(vecY dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3567
  predicate(n->as_Vector()->length() == 32);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3568
  match(Set dst (ReplicateB zero));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3569
  format %{ "vpxor   $dst,$dst,$dst\t! replicate32B zero" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3570
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3571
    // Use vxorpd since AVX does not have vpxor for 256-bit (AVX2 will have it).
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3572
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3573
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3574
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3575
  ins_pipe( fpu_reg_reg );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3576
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3577
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3578
// Replicate char/short (2 byte) scalar to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3579
instruct Repl2S(vecS dst, rRegI src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3580
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3581
  match(Set dst (ReplicateS src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3582
  format %{ "movd    $dst,$src\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3583
            "pshuflw $dst,$dst,0x00\t! replicate2S" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3584
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3585
    __ movdl($dst$$XMMRegister, $src$$Register);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3586
    __ pshuflw($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3587
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3588
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3589
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3590
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3591
// Replicate char/short (2 byte) scalar immediate to be vector by loading from const table.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3592
instruct Repl2S_imm(vecS dst, immI con) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3593
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3594
  match(Set dst (ReplicateS con));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3595
  format %{ "movdl   $dst,[$constantaddress]\t! replicate2S($con)" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3596
  ins_encode %{
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3597
    __ movdl($dst$$XMMRegister, $constantaddress(replicate4_imm($con$$constant, 2)));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3598
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3599
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3600
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3601
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3602
instruct Repl4S_imm(vecD dst, immI con) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3603
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3604
  match(Set dst (ReplicateS con));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3605
  format %{ "movq    $dst,[$constantaddress]\t! replicate4S($con)" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3606
  ins_encode %{
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3607
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3608
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3609
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3610
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3611
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3612
// Replicate char/short (2 byte) scalar zero to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3613
instruct Repl2S_zero(vecS dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3614
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3615
  match(Set dst (ReplicateS zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3616
  format %{ "pxor    $dst,$dst\t! replicate2S zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3617
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3618
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3619
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3620
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3621
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3622
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3623
instruct Repl4S_zero(vecD dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3624
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3625
  match(Set dst (ReplicateS zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3626
  format %{ "pxor    $dst,$dst\t! replicate4S zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3627
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3628
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3629
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3630
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3631
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3632
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3633
instruct Repl8S_zero(vecX dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3634
  predicate(n->as_Vector()->length() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3635
  match(Set dst (ReplicateS zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3636
  format %{ "pxor    $dst,$dst\t! replicate8S zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3637
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3638
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3639
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3640
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3641
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3642
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3643
instruct Repl16S_zero(vecY dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3644
  predicate(n->as_Vector()->length() == 16);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3645
  match(Set dst (ReplicateS zero));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3646
  format %{ "vpxor   $dst,$dst,$dst\t! replicate16S zero" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3647
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3648
    // Use vxorpd since AVX does not have vpxor for 256-bit (AVX2 will have it).
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3649
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3650
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3651
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3652
  ins_pipe( fpu_reg_reg );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3653
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3654
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3655
// Replicate integer (4 byte) scalar to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3656
instruct Repl2I(vecD dst, rRegI src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3657
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3658
  match(Set dst (ReplicateI src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3659
  format %{ "movd    $dst,$src\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3660
            "pshufd  $dst,$dst,0x00\t! replicate2I" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3661
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3662
    __ movdl($dst$$XMMRegister, $src$$Register);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3663
    __ pshufd($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3664
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3665
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3666
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3667
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3668
// Integer could be loaded into xmm register directly from memory.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3669
instruct Repl2I_mem(vecD dst, memory mem) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3670
  predicate(n->as_Vector()->length() == 2);
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3671
  match(Set dst (ReplicateI (LoadI mem)));
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3672
  format %{ "movd    $dst,$mem\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3673
            "pshufd  $dst,$dst,0x00\t! replicate2I" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3674
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3675
    __ movdl($dst$$XMMRegister, $mem$$Address);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3676
    __ pshufd($dst$$XMMRegister, $dst$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3677
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3678
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3679
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3680
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3681
// Replicate integer (4 byte) scalar immediate to be vector by loading from const table.
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3682
instruct Repl2I_imm(vecD dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3683
  predicate(n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3684
  match(Set dst (ReplicateI con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3685
  format %{ "movq    $dst,[$constantaddress]\t! replicate2I($con)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3686
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3687
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3688
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3689
  ins_pipe( fpu_reg_reg );
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3690
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3691
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3692
// Replicate integer (4 byte) scalar zero to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3693
instruct Repl2I_zero(vecD dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3694
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3695
  match(Set dst (ReplicateI zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3696
  format %{ "pxor    $dst,$dst\t! replicate2I" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3697
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3698
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3699
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3700
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3701
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3702
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3703
instruct Repl4I_zero(vecX dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3704
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3705
  match(Set dst (ReplicateI zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3706
  format %{ "pxor    $dst,$dst\t! replicate4I zero)" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3707
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3708
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3709
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3710
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3711
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3712
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3713
instruct Repl8I_zero(vecY dst, immI0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3714
  predicate(n->as_Vector()->length() == 8);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3715
  match(Set dst (ReplicateI zero));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3716
  format %{ "vpxor   $dst,$dst,$dst\t! replicate8I zero" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3717
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3718
    // Use vxorpd since AVX does not have vpxor for 256-bit (AVX2 will have it).
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3719
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3720
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3721
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3722
  ins_pipe( fpu_reg_reg );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3723
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3724
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3725
// Replicate long (8 byte) scalar to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3726
#ifdef _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3727
instruct Repl2L(vecX dst, rRegL src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3728
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3729
  match(Set dst (ReplicateL src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3730
  format %{ "movdq   $dst,$src\n\t"
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3731
            "punpcklqdq $dst,$dst\t! replicate2L" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3732
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3733
    __ movdq($dst$$XMMRegister, $src$$Register);
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3734
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3735
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3736
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3737
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3738
#else // _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3739
instruct Repl2L(vecX dst, eRegL src, regD tmp) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3740
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3741
  match(Set dst (ReplicateL src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3742
  effect(TEMP dst, USE src, TEMP tmp);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3743
  format %{ "movdl   $dst,$src.lo\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3744
            "movdl   $tmp,$src.hi\n\t"
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3745
            "punpckldq $dst,$tmp\n\t"
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3746
            "punpcklqdq $dst,$dst\t! replicate2L"%}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3747
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3748
    __ movdl($dst$$XMMRegister, $src$$Register);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3749
    __ movdl($tmp$$XMMRegister, HIGH_FROM_LOW($src$$Register));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3750
    __ punpckldq($dst$$XMMRegister, $tmp$$XMMRegister);
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3751
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3752
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3753
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3754
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3755
#endif // _LP64
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3756
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3757
// Replicate long (8 byte) scalar immediate to be vector by loading from const table.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3758
instruct Repl2L_imm(vecX dst, immL con) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3759
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3760
  match(Set dst (ReplicateL con));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3761
  format %{ "movq    $dst,[$constantaddress]\n\t"
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3762
            "punpcklqdq $dst,$dst\t! replicate2L($con)" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3763
  ins_encode %{
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3764
    __ movq($dst$$XMMRegister, $constantaddress($con));
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3765
    __ punpcklqdq($dst$$XMMRegister, $dst$$XMMRegister);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3766
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3767
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3768
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3769
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3770
// Replicate long (8 byte) scalar zero to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3771
instruct Repl2L_zero(vecX dst, immL0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3772
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3773
  match(Set dst (ReplicateL zero));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3774
  format %{ "pxor    $dst,$dst\t! replicate2L zero" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3775
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3776
    __ pxor($dst$$XMMRegister, $dst$$XMMRegister);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3777
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3778
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3779
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3780
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3781
instruct Repl4L_zero(vecY dst, immL0 zero) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3782
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3783
  match(Set dst (ReplicateL zero));
13294
80131b419f85 7181494: cleanup avx and vectors code
kvn
parents: 13108
diff changeset
  3784
  format %{ "vpxor   $dst,$dst,$dst\t! replicate4L zero" %}
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3785
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3786
    // Use vxorpd since AVX does not have vpxor for 256-bit (AVX2 will have it).
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3787
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3788
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3789
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3790
  ins_pipe( fpu_reg_reg );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3791
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  3792
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3793
// Replicate float (4 byte) scalar to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3794
instruct Repl2F(vecD dst, regF src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3795
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3796
  match(Set dst (ReplicateF src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3797
  format %{ "pshufd  $dst,$dst,0x00\t! replicate2F" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3798
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3799
    __ pshufd($dst$$XMMRegister, $src$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3800
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3801
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3802
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3803
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3804
instruct Repl4F(vecX dst, regF src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3805
  predicate(n->as_Vector()->length() == 4);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3806
  match(Set dst (ReplicateF src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3807
  format %{ "pshufd  $dst,$dst,0x00\t! replicate4F" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3808
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3809
    __ pshufd($dst$$XMMRegister, $src$$XMMRegister, 0x00);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3810
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3811
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3812
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3813
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3814
// Replicate double (8 bytes) scalar to be vector
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3815
instruct Repl2D(vecX dst, regD src) %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3816
  predicate(n->as_Vector()->length() == 2);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3817
  match(Set dst (ReplicateD src));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3818
  format %{ "pshufd  $dst,$src,0x44\t! replicate2D" %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3819
  ins_encode %{
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3820
    __ pshufd($dst$$XMMRegister, $src$$XMMRegister, 0x44);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3821
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3822
  ins_pipe( pipe_slow );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3823
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  3824
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3825
// ====================EVEX REPLICATE=============================================
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3826
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3827
instruct Repl4B_mem_evex(vecS dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3828
  predicate(n->as_Vector()->length() == 4 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3829
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3830
  format %{ "vpbroadcastb  $dst,$mem\t! replicate4B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3831
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3832
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3833
    __ evpbroadcastb($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3834
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3835
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3836
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3837
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3838
instruct Repl8B_mem_evex(vecD dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3839
  predicate(n->as_Vector()->length() == 8 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3840
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3841
  format %{ "vpbroadcastb  $dst,$mem\t! replicate8B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3842
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3843
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3844
    __ evpbroadcastb($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3845
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3846
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3847
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3848
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3849
instruct Repl16B_evex(vecX dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3850
  predicate(n->as_Vector()->length() == 16 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3851
  match(Set dst (ReplicateB src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3852
  format %{ "vpbroadcastb $dst,$src\t! replicate16B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3853
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3854
   int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3855
    __ evpbroadcastb($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3856
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3857
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3858
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3859
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3860
instruct Repl16B_mem_evex(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3861
  predicate(n->as_Vector()->length() == 16 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3862
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3863
  format %{ "vpbroadcastb  $dst,$mem\t! replicate16B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3864
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3865
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3866
    __ evpbroadcastb($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3867
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3868
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3869
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3870
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3871
instruct Repl32B_evex(vecY dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3872
  predicate(n->as_Vector()->length() == 32 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3873
  match(Set dst (ReplicateB src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3874
  format %{ "vpbroadcastb $dst,$src\t! replicate32B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3875
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3876
   int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3877
    __ evpbroadcastb($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3878
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3879
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3880
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3881
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3882
instruct Repl32B_mem_evex(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3883
  predicate(n->as_Vector()->length() == 32 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3884
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3885
  format %{ "vpbroadcastb  $dst,$mem\t! replicate32B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3886
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3887
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3888
    __ evpbroadcastb($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3889
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3890
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3891
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3892
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3893
instruct Repl64B_evex(vecZ dst, rRegI src) %{
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3894
  predicate(n->as_Vector()->length() == 64 && VM_Version::supports_avx512bw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3895
  match(Set dst (ReplicateB src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3896
  format %{ "vpbroadcastb $dst,$src\t! upper replicate64B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3897
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3898
   int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3899
    __ evpbroadcastb($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3900
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3901
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3902
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3903
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3904
instruct Repl64B_mem_evex(vecZ dst, memory mem) %{
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3905
  predicate(n->as_Vector()->length() == 64 && VM_Version::supports_avx512bw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3906
  match(Set dst (ReplicateB (LoadB mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3907
  format %{ "vpbroadcastb  $dst,$mem\t! replicate64B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3908
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3909
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3910
    __ evpbroadcastb($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3911
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3912
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3913
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3914
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3915
instruct Repl16B_imm_evex(vecX dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3916
  predicate(n->as_Vector()->length() == 16 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3917
  match(Set dst (ReplicateB con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3918
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3919
            "vpbroadcastb $dst,$dst\t! replicate16B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3920
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3921
   int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3922
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3923
    __ evpbroadcastb($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3924
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3925
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3926
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3927
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3928
instruct Repl32B_imm_evex(vecY dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3929
  predicate(n->as_Vector()->length() == 32 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3930
  match(Set dst (ReplicateB con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3931
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3932
            "vpbroadcastb $dst,$dst\t! replicate32B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3933
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3934
   int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3935
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3936
    __ evpbroadcastb($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3937
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3938
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3939
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3940
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3941
instruct Repl64B_imm_evex(vecZ dst, immI con) %{
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  3942
  predicate(n->as_Vector()->length() == 64 && VM_Version::supports_avx512bw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3943
  match(Set dst (ReplicateB con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3944
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3945
            "vpbroadcastb $dst,$dst\t! upper replicate64B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3946
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3947
   int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3948
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 1)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3949
    __ evpbroadcastb($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3950
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3951
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3952
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3953
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3954
instruct Repl64B_zero_evex(vecZ dst, immI0 zero) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3955
  predicate(n->as_Vector()->length() == 64 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3956
  match(Set dst (ReplicateB zero));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3957
  format %{ "vpxor   $dst k0,$dst,$dst\t! replicate64B zero" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3958
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3959
    // Use vxorpd since AVX does not have vpxor for 512-bit (EVEX will have it).
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3960
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3961
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3962
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3963
  ins_pipe( fpu_reg_reg );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3964
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3965
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3966
instruct Repl4S_evex(vecD dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3967
  predicate(n->as_Vector()->length() == 4 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3968
  match(Set dst (ReplicateS src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3969
  format %{ "vpbroadcastw $dst,$src\t! replicate4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3970
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3971
   int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3972
    __ evpbroadcastw($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3973
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3974
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3975
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3976
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3977
instruct Repl4S_mem_evex(vecD dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3978
  predicate(n->as_Vector()->length() == 4 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3979
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3980
  format %{ "vpbroadcastw  $dst,$mem\t! replicate4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3981
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3982
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3983
    __ evpbroadcastw($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3984
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3985
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3986
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3987
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3988
instruct Repl8S_evex(vecX dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3989
  predicate(n->as_Vector()->length() == 8 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3990
  match(Set dst (ReplicateS src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3991
  format %{ "vpbroadcastw $dst,$src\t! replicate8S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3992
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3993
   int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3994
    __ evpbroadcastw($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3995
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3996
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3997
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3998
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  3999
instruct Repl8S_mem_evex(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4000
  predicate(n->as_Vector()->length() == 8 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4001
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4002
  format %{ "vpbroadcastw  $dst,$mem\t! replicate8S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4003
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4004
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4005
    __ evpbroadcastw($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4006
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4007
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4008
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4009
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4010
instruct Repl16S_evex(vecY dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4011
  predicate(n->as_Vector()->length() == 16 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4012
  match(Set dst (ReplicateS src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4013
  format %{ "vpbroadcastw $dst,$src\t! replicate16S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4014
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4015
   int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4016
    __ evpbroadcastw($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4017
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4018
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4019
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4020
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4021
instruct Repl16S_mem_evex(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4022
  predicate(n->as_Vector()->length() == 16 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4023
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4024
  format %{ "vpbroadcastw  $dst,$mem\t! replicate16S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4025
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4026
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4027
    __ evpbroadcastw($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4028
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4029
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4030
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4031
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4032
instruct Repl32S_evex(vecZ dst, rRegI src) %{
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4033
  predicate(n->as_Vector()->length() == 32 && VM_Version::supports_avx512bw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4034
  match(Set dst (ReplicateS src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4035
  format %{ "vpbroadcastw $dst,$src\t! replicate32S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4036
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4037
   int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4038
    __ evpbroadcastw($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4039
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4040
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4041
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4042
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4043
instruct Repl32S_mem_evex(vecZ dst, memory mem) %{
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4044
  predicate(n->as_Vector()->length() == 32 && VM_Version::supports_avx512bw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4045
  match(Set dst (ReplicateS (LoadS mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4046
  format %{ "vpbroadcastw  $dst,$mem\t! replicate32S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4047
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4048
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4049
    __ evpbroadcastw($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4050
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4051
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4052
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4053
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4054
instruct Repl8S_imm_evex(vecX dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4055
  predicate(n->as_Vector()->length() == 8 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4056
  match(Set dst (ReplicateS con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4057
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4058
            "vpbroadcastw $dst,$dst\t! replicate8S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4059
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4060
   int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4061
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4062
    __ evpbroadcastw($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4063
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4064
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4065
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4066
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4067
instruct Repl16S_imm_evex(vecY dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4068
  predicate(n->as_Vector()->length() == 16 && VM_Version::supports_avx512vlbw());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4069
  match(Set dst (ReplicateS con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4070
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4071
            "vpbroadcastw $dst,$dst\t! replicate16S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4072
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4073
   int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4074
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4075
    __ evpbroadcastw($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4076
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4077
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4078
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4079
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4080
instruct Repl32S_imm_evex(vecZ dst, immI con) %{
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4081
  predicate(n->as_Vector()->length() == 32 && VM_Version::supports_avx512bw());
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4082
  match(Set dst (ReplicateS con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4083
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4084
            "vpbroadcastw $dst,$dst\t! replicate32S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4085
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4086
   int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4087
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 2)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4088
    __ evpbroadcastw($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4089
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4090
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4091
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4092
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4093
instruct Repl32S_zero_evex(vecZ dst, immI0 zero) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4094
  predicate(n->as_Vector()->length() == 32 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4095
  match(Set dst (ReplicateS zero));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4096
  format %{ "vpxor   $dst k0,$dst,$dst\t! replicate32S zero" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4097
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4098
    // Use vxorpd since AVX does not have vpxor for 512-bit (EVEX will have it).
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4099
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4100
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4101
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4102
  ins_pipe( fpu_reg_reg );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4103
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4104
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4105
instruct Repl4I_evex(vecX dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4106
  predicate(n->as_Vector()->length() == 4 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4107
  match(Set dst (ReplicateI src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4108
  format %{ "vpbroadcastd  $dst,$src\t! replicate4I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4109
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4110
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4111
    __ evpbroadcastd($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4112
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4113
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4114
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4115
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4116
instruct Repl4I_mem_evex(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4117
  predicate(n->as_Vector()->length() == 4 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4118
  match(Set dst (ReplicateI (LoadI mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4119
  format %{ "vpbroadcastd  $dst,$mem\t! replicate4I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4120
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4121
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4122
    __ evpbroadcastd($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4123
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4124
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4125
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4126
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4127
instruct Repl8I_evex(vecY dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4128
  predicate(n->as_Vector()->length() == 8 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4129
  match(Set dst (ReplicateI src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4130
  format %{ "vpbroadcastd  $dst,$src\t! replicate8I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4131
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4132
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4133
    __ evpbroadcastd($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4134
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4135
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4136
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4137
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4138
instruct Repl8I_mem_evex(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4139
  predicate(n->as_Vector()->length() == 8 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4140
  match(Set dst (ReplicateI (LoadI mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4141
  format %{ "vpbroadcastd  $dst,$mem\t! replicate8I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4142
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4143
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4144
    __ evpbroadcastd($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4145
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4146
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4147
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4148
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4149
instruct Repl16I_evex(vecZ dst, rRegI src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4150
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4151
  match(Set dst (ReplicateI src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4152
  format %{ "vpbroadcastd  $dst,$src\t! replicate16I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4153
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4154
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4155
    __ evpbroadcastd($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4156
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4157
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4158
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4159
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4160
instruct Repl16I_mem_evex(vecZ dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4161
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4162
  match(Set dst (ReplicateI (LoadI mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4163
  format %{ "vpbroadcastd  $dst,$mem\t! replicate16I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4164
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4165
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4166
    __ evpbroadcastd($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4167
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4168
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4169
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4170
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4171
instruct Repl4I_imm_evex(vecX dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4172
  predicate(n->as_Vector()->length() == 4 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4173
  match(Set dst (ReplicateI con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4174
  format %{ "movq    $dst,[$constantaddress]\t! replicate8I($con)\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4175
            "vpbroadcastd  $dst,$dst\t! replicate4I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4176
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4177
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4178
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4179
    __ evpbroadcastd($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4180
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4181
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4182
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4183
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4184
instruct Repl8I_imm_evex(vecY dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4185
  predicate(n->as_Vector()->length() == 8 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4186
  match(Set dst (ReplicateI con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4187
  format %{ "movq    $dst,[$constantaddress]\t! replicate8I($con)\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4188
            "vpbroadcastd  $dst,$dst\t! replicate8I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4189
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4190
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4191
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4192
    __ evpbroadcastd($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4193
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4194
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4195
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4196
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4197
instruct Repl16I_imm_evex(vecZ dst, immI con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4198
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4199
  match(Set dst (ReplicateI con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4200
  format %{ "movq    $dst,[$constantaddress]\t! replicate16I($con)\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4201
            "vpbroadcastd  $dst,$dst\t! replicate16I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4202
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4203
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4204
    __ movq($dst$$XMMRegister, $constantaddress(replicate8_imm($con$$constant, 4)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4205
    __ evpbroadcastd($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4206
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4207
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4208
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4209
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4210
instruct Repl16I_zero_evex(vecZ dst, immI0 zero) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4211
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4212
  match(Set dst (ReplicateI zero));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4213
  format %{ "vpxor   $dst k0,$dst,$dst\t! replicate16I zero" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4214
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4215
    // Use vxorpd since AVX does not have vpxor for 512-bit (AVX2 will have it).
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4216
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4217
    __ vpxor($dst$$XMMRegister, $dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4218
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4219
  ins_pipe( fpu_reg_reg );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4220
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4221
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4222
// Replicate long (8 byte) scalar to be vector
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4223
#ifdef _LP64
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4224
instruct Repl4L_evex(vecY dst, rRegL src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4225
  predicate(n->as_Vector()->length() == 4 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4226
  match(Set dst (ReplicateL src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4227
  format %{ "vpbroadcastq  $dst,$src\t! replicate4L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4228
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4229
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4230
    __ evpbroadcastq($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4231
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4232
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4233
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4234
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4235
instruct Repl8L_evex(vecZ dst, rRegL src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4236
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4237
  match(Set dst (ReplicateL src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4238
  format %{ "vpbroadcastq  $dst,$src\t! replicate8L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4239
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4240
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4241
    __ evpbroadcastq($dst$$XMMRegister, $src$$Register, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4242
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4243
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4244
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4245
#else // _LP64
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4246
instruct Repl4L_evex(vecY dst, eRegL src, regD tmp) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4247
  predicate(n->as_Vector()->length() == 4 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4248
  match(Set dst (ReplicateL src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4249
  effect(TEMP dst, USE src, TEMP tmp);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4250
  format %{ "movdl   $dst,$src.lo\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4251
            "movdl   $tmp,$src.hi\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4252
            "punpckldq $dst,$tmp\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4253
            "vpbroadcastq  $dst,$dst\t! replicate4L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4254
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4255
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4256
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4257
    __ movdl($tmp$$XMMRegister, HIGH_FROM_LOW($src$$Register));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4258
    __ punpckldq($dst$$XMMRegister, $tmp$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4259
    __ evpbroadcastq($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4260
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4261
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4262
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4263
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4264
instruct Repl8L_evex(vecZ dst, eRegL src, regD tmp) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4265
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4266
  match(Set dst (ReplicateL src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4267
  effect(TEMP dst, USE src, TEMP tmp);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4268
  format %{ "movdl   $dst,$src.lo\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4269
            "movdl   $tmp,$src.hi\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4270
            "punpckldq $dst,$tmp\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4271
            "vpbroadcastq  $dst,$dst\t! replicate8L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4272
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4273
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4274
    __ movdl($dst$$XMMRegister, $src$$Register);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4275
    __ movdl($tmp$$XMMRegister, HIGH_FROM_LOW($src$$Register));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4276
    __ punpckldq($dst$$XMMRegister, $tmp$$XMMRegister);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4277
    __ evpbroadcastq($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4278
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4279
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4280
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4281
#endif // _LP64
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4282
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4283
instruct Repl4L_imm_evex(vecY dst, immL con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4284
  predicate(n->as_Vector()->length() == 4 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4285
  match(Set dst (ReplicateL con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4286
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4287
            "vpbroadcastq  $dst,$dst\t! replicate4L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4288
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4289
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4290
    __ movq($dst$$XMMRegister, $constantaddress($con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4291
    __ evpbroadcastq($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4292
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4293
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4294
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4295
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4296
instruct Repl8L_imm_evex(vecZ dst, immL con) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4297
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4298
  match(Set dst (ReplicateL con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4299
  format %{ "movq    $dst,[$constantaddress]\n\t"
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4300
            "vpbroadcastq  $dst,$dst\t! replicate8L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4301
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4302
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4303
    __ movq($dst$$XMMRegister, $constantaddress($con));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4304
    __ evpbroadcastq($dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4305
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4306
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4307
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4308
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4309
instruct Repl2L_mem_evex(vecX dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4310
  predicate(n->as_Vector()->length() == 2 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4311
  match(Set dst (ReplicateL (LoadL mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4312
  format %{ "vpbroadcastd  $dst,$mem\t! replicate2L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4313
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4314
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4315
    __ evpbroadcastq($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4316
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4317
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4318
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4319
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4320
instruct Repl4L_mem_evex(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4321
  predicate(n->as_Vector()->length() == 4 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4322
  match(Set dst (ReplicateL (LoadL mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4323
  format %{ "vpbroadcastd  $dst,$mem\t! replicate4L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4324
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4325
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4326
    __ evpbroadcastq($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4327
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4328
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4329
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4330
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4331
instruct Repl8L_mem_evex(vecZ dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4332
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4333
  match(Set dst (ReplicateL (LoadL mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4334
  format %{ "vpbroadcastd  $dst,$mem\t! replicate8L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4335
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4336
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4337
    __ evpbroadcastq($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4338
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4339
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4340
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4341
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4342
instruct Repl8L_zero_evex(vecZ dst, immL0 zero) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4343
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4344
  match(Set dst (ReplicateL zero));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4345
  format %{ "vpxor   $dst k0,$dst,$dst\t! replicate8L zero" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4346
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4347
    // Use vxorpd since AVX does not have vpxor for 512-bit (EVEX will have it).
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4348
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4349
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4350
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4351
  ins_pipe( fpu_reg_reg );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4352
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4353
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4354
instruct Repl8F_evex(vecY dst, regF src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4355
  predicate(n->as_Vector()->length() == 8 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4356
  match(Set dst (ReplicateF src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4357
  format %{ "vbroadcastss $dst,$src\t! replicate8F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4358
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4359
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4360
    __ evpbroadcastss($dst$$XMMRegister, $src$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4361
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4362
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4363
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4364
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4365
instruct Repl8F_mem_evex(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4366
  predicate(n->as_Vector()->length() == 8 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4367
  match(Set dst (ReplicateF (LoadF mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4368
  format %{ "vbroadcastss  $dst,$mem\t! replicate8F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4369
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4370
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4371
    __ evpbroadcastss($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4372
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4373
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4374
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4375
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4376
instruct Repl16F_evex(vecZ dst, regF src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4377
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4378
  match(Set dst (ReplicateF src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4379
  format %{ "vbroadcastss $dst,$src\t! replicate16F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4380
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4381
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4382
    __ evpbroadcastss($dst$$XMMRegister, $src$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4383
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4384
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4385
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4386
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4387
instruct Repl16F_mem_evex(vecZ dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4388
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4389
  match(Set dst (ReplicateF (LoadF mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4390
  format %{ "vbroadcastss  $dst,$mem\t! replicate16F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4391
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4392
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4393
    __ evpbroadcastss($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4394
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4395
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4396
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4397
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4398
instruct Repl2F_zero_evex(vecD dst, immF0 zero) %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4399
  predicate(n->as_Vector()->length() == 2 && UseAVX > 2);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4400
  match(Set dst (ReplicateF zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4401
  format %{ "vpxor  $dst k0,$dst,$dst\t! replicate2F zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4402
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4403
    // Use vpxor in place of vxorps since EVEX has a constriant on dq for vxorps: this is a 512-bit operation
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4404
    int vector_len = 2;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4405
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4406
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4407
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4408
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4409
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4410
instruct Repl4F_zero_evex(vecX dst, immF0 zero) %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4411
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4412
  match(Set dst (ReplicateF zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4413
  format %{ "vpxor  $dst k0,$dst,$dst\t! replicate4F zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4414
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4415
    // Use vpxor in place of vxorps since EVEX has a constriant on dq for vxorps: this is a 512-bit operation
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4416
    int vector_len = 2;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4417
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4418
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4419
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4420
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4421
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4422
instruct Repl8F_zero_evex(vecY dst, immF0 zero) %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4423
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4424
  match(Set dst (ReplicateF zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4425
  format %{ "vpxor  $dst k0,$dst,$dst\t! replicate8F zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4426
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4427
    // Use vpxor in place of vxorps since EVEX has a constriant on dq for vxorps: this is a 512-bit operation
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4428
    int vector_len = 2;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4429
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4430
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4431
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4432
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4433
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4434
instruct Repl16F_zero_evex(vecZ dst, immF0 zero) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4435
  predicate(n->as_Vector()->length() == 16 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4436
  match(Set dst (ReplicateF zero));
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4437
  format %{ "vpxor  $dst k0,$dst,$dst\t! replicate16F zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4438
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4439
    // Use vpxor in place of vxorps since EVEX has a constriant on dq for vxorps: this is a 512-bit operation
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4440
    int vector_len = 2;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4441
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4442
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4443
  ins_pipe( fpu_reg_reg );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4444
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4445
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4446
instruct Repl4D_evex(vecY dst, regD src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4447
  predicate(n->as_Vector()->length() == 4 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4448
  match(Set dst (ReplicateD src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4449
  format %{ "vbroadcastsd $dst,$src\t! replicate4D" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4450
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4451
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4452
    __ evpbroadcastsd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4453
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4454
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4455
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4456
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4457
instruct Repl4D_mem_evex(vecY dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4458
  predicate(n->as_Vector()->length() == 4 && VM_Version::supports_avx512vl());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4459
  match(Set dst (ReplicateD (LoadD mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4460
  format %{ "vbroadcastsd  $dst,$mem\t! replicate4D" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4461
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4462
    int vector_len = 1;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4463
    __ evpbroadcastsd($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4464
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4465
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4466
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4467
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4468
instruct Repl8D_evex(vecZ dst, regD src) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4469
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4470
  match(Set dst (ReplicateD src));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4471
  format %{ "vbroadcastsd $dst,$src\t! replicate8D" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4472
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4473
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4474
    __ evpbroadcastsd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4475
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4476
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4477
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4478
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4479
instruct Repl8D_mem_evex(vecZ dst, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4480
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4481
  match(Set dst (ReplicateD (LoadD mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4482
  format %{ "vbroadcastsd  $dst,$mem\t! replicate8D" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4483
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4484
    int vector_len = 2;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4485
    __ evpbroadcastsd($dst$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4486
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4487
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4488
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4489
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4490
instruct Repl2D_zero_evex(vecX dst, immD0 zero) %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4491
  predicate(n->as_Vector()->length() == 2 && UseAVX > 2);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4492
  match(Set dst (ReplicateD zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4493
  format %{ "vpxor  $dst k0,$dst,$dst\t! replicate2D zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4494
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4495
    // Use vpxor in place of vxorpd since EVEX has a constriant on dq for vxorpd: this is a 512-bit operation
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4496
    int vector_len = 2;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4497
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4498
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4499
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4500
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4501
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4502
instruct Repl4D_zero_evex(vecY dst, immD0 zero) %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4503
  predicate(n->as_Vector()->length() == 4 && UseAVX > 2);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4504
  match(Set dst (ReplicateD zero));
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4505
  format %{ "vpxor  $dst k0,$dst,$dst\t! replicate4D zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4506
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4507
    // Use vpxor in place of vxorpd since EVEX has a constriant on dq for vxorpd: this is a 512-bit operation
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4508
    int vector_len = 2;
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4509
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4510
  %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4511
  ins_pipe( fpu_reg_reg );
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4512
%}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4513
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4514
instruct Repl8D_zero_evex(vecZ dst, immD0 zero) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  4515
  predicate(n->as_Vector()->length() == 8 && UseAVX > 2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4516
  match(Set dst (ReplicateD zero));
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4517
  format %{ "vpxor  $dst k0,$dst,$dst,vect512\t! replicate8D zero" %}
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4518
  ins_encode %{
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4519
    // Use vpxor in place of vxorpd since EVEX has a constriant on dq for vxorpd: this is a 512-bit operation
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4520
    int vector_len = 2;
32727
320855c2baef 8132160: support for AVX 512 call frames and stack management
mcberg
parents: 32723
diff changeset
  4521
    __ vpxor($dst$$XMMRegister,$dst$$XMMRegister, $dst$$XMMRegister, vector_len);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4522
  %}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4523
  ins_pipe( fpu_reg_reg );
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4524
%}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11794
diff changeset
  4525
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4526
// ====================REDUCTION ARITHMETIC=======================================
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4527
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4528
instruct rsadd2I_reduction_reg(rRegI dst, rRegI src1, vecD src2, regF tmp, regF tmp2) %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4529
  predicate(UseSSE > 2 && UseAVX == 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4530
  match(Set dst (AddReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4531
  effect(TEMP tmp2, TEMP tmp);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4532
  format %{ "movdqu  $tmp2,$src2\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4533
            "phaddd  $tmp2,$tmp2\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4534
            "movd    $tmp,$src1\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4535
            "paddd   $tmp,$tmp2\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4536
            "movd    $dst,$tmp\t! add reduction2I" %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4537
  ins_encode %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4538
    __ movdqu($tmp2$$XMMRegister, $src2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4539
    __ phaddd($tmp2$$XMMRegister, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4540
    __ movdl($tmp$$XMMRegister, $src1$$Register);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4541
    __ paddd($tmp$$XMMRegister, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4542
    __ movdl($dst$$Register, $tmp$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4543
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4544
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4545
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4546
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4547
instruct rvadd2I_reduction_reg(rRegI dst, rRegI src1, vecD src2, regF tmp, regF tmp2) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4548
  predicate(VM_Version::supports_avxonly());
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4549
  match(Set dst (AddReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4550
  effect(TEMP tmp, TEMP tmp2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4551
  format %{ "vphaddd  $tmp,$src2,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4552
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4553
            "vpaddd   $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4554
            "movd     $dst,$tmp2\t! add reduction2I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4555
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4556
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4557
    __ vphaddd($tmp$$XMMRegister, $src2$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4558
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4559
    __ vpaddd($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4560
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4561
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4562
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4563
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4564
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4565
instruct rvadd2I_reduction_reg_evex(rRegI dst, rRegI src1, vecD src2, regF tmp, regF tmp2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4566
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4567
  match(Set dst (AddReductionVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4568
  effect(TEMP tmp, TEMP tmp2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4569
  format %{ "pshufd  $tmp2,$src2,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4570
            "vpaddd  $tmp,$src2,$tmp2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4571
            "movd    $tmp2,$src1\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4572
            "vpaddd  $tmp2,$tmp,$tmp2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4573
            "movd    $dst,$tmp2\t! add reduction2I" %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4574
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4575
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4576
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4577
    __ vpaddd($tmp$$XMMRegister, $src2$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4578
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4579
    __ vpaddd($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4580
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4581
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4582
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4583
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4584
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4585
instruct rsadd4I_reduction_reg(rRegI dst, rRegI src1, vecX src2, regF tmp, regF tmp2) %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4586
  predicate(UseSSE > 2 && UseAVX == 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4587
  match(Set dst (AddReductionVI src1 src2));
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4588
  effect(TEMP tmp, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4589
  format %{ "movdqu  $tmp,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4590
            "phaddd  $tmp,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4591
            "phaddd  $tmp,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4592
            "movd    $tmp2,$src1\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4593
            "paddd   $tmp2,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4594
            "movd    $dst,$tmp2\t! add reduction4I" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4595
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4596
    __ movdqu($tmp$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4597
    __ phaddd($tmp$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4598
    __ phaddd($tmp$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4599
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4600
    __ paddd($tmp2$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4601
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4602
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4603
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4604
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4605
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4606
instruct rvadd4I_reduction_reg(rRegI dst, rRegI src1, vecX src2, regF tmp, regF tmp2) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4607
  predicate(VM_Version::supports_avxonly());
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4608
  match(Set dst (AddReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4609
  effect(TEMP tmp, TEMP tmp2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4610
  format %{ "vphaddd  $tmp,$src2,$src2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4611
            "vphaddd  $tmp,$tmp,$tmp\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4612
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4613
            "vpaddd   $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4614
            "movd     $dst,$tmp2\t! add reduction4I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4615
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4616
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4617
    __ vphaddd($tmp$$XMMRegister, $src2$$XMMRegister, $src2$$XMMRegister, vector_len);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4618
    __ vphaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp$$XMMRegister, vector_len);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4619
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4620
    __ vpaddd($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4621
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4622
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4623
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4624
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4625
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4626
instruct rvadd4I_reduction_reg_evex(rRegI dst, rRegI src1, vecX src2, regF tmp, regF tmp2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4627
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4628
  match(Set dst (AddReductionVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4629
  effect(TEMP tmp, TEMP tmp2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4630
  format %{ "pshufd  $tmp2,$src2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4631
            "vpaddd  $tmp,$src2,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4632
            "pshufd  $tmp2,$tmp,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4633
            "vpaddd  $tmp,$tmp,$tmp2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4634
            "movd    $tmp2,$src1\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4635
            "vpaddd  $tmp2,$tmp,$tmp2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4636
            "movd    $dst,$tmp2\t! add reduction4I" %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4637
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4638
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4639
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4640
    __ vpaddd($tmp$$XMMRegister, $src2$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4641
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0x1);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4642
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4643
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4644
    __ vpaddd($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4645
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4646
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4647
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4648
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4649
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4650
instruct rvadd8I_reduction_reg(rRegI dst, rRegI src1, vecY src2, regF tmp, regF tmp2) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4651
  predicate(VM_Version::supports_avxonly());
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4652
  match(Set dst (AddReductionVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4653
  effect(TEMP tmp, TEMP tmp2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4654
  format %{ "vphaddd  $tmp,$src2,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4655
            "vphaddd  $tmp,$tmp,$tmp2\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4656
            "vextracti128_high  $tmp2,$tmp\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4657
            "vpaddd   $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4658
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4659
            "vpaddd   $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4660
            "movd     $dst,$tmp2\t! add reduction8I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4661
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4662
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4663
    __ vphaddd($tmp$$XMMRegister, $src2$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4664
    __ vphaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4665
    __ vextracti128_high($tmp2$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4666
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4667
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4668
    __ vpaddd($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4669
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4670
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4671
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4672
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4673
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4674
instruct rvadd8I_reduction_reg_evex(rRegI dst, rRegI src1, vecY src2, regF tmp, regF tmp2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4675
  predicate(UseAVX > 2);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4676
  match(Set dst (AddReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4677
  effect(TEMP tmp, TEMP tmp2);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4678
  format %{ "vextracti128_high  $tmp,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4679
            "vpaddd  $tmp,$tmp,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4680
            "pshufd  $tmp2,$tmp,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4681
            "vpaddd  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4682
            "pshufd  $tmp2,$tmp,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4683
            "vpaddd  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4684
            "movd    $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4685
            "vpaddd  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4686
            "movd    $dst,$tmp2\t! add reduction8I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4687
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4688
    int vector_len = 0;
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4689
    __ vextracti128_high($tmp$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4690
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4691
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4692
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4693
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0x1);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4694
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4695
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4696
    __ vpaddd($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4697
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4698
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4699
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4700
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4701
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4702
instruct rvadd16I_reduction_reg_evex(rRegI dst, rRegI src1, vecZ src2, regF tmp, regF tmp2, regF tmp3) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4703
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4704
  match(Set dst (AddReductionVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4705
  effect(TEMP tmp, TEMP tmp2, TEMP tmp3);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4706
  format %{ "vextracti64x4_high  $tmp3,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4707
            "vpaddd  $tmp3,$tmp3,$src2\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4708
            "vextracti128_high  $tmp,$tmp3\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4709
            "vpaddd  $tmp,$tmp,$tmp3\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4710
            "pshufd  $tmp2,$tmp,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4711
            "vpaddd  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4712
            "pshufd  $tmp2,$tmp,0x1\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4713
            "vpaddd  $tmp,$tmp,$tmp2\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4714
            "movd    $tmp2,$src1\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4715
            "vpaddd  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4716
            "movd    $dst,$tmp2\t! mul reduction16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4717
  ins_encode %{
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4718
    __ vextracti64x4_high($tmp3$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4719
    __ vpaddd($tmp3$$XMMRegister, $tmp3$$XMMRegister, $src2$$XMMRegister, 1);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4720
    __ vextracti128_high($tmp$$XMMRegister, $tmp3$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4721
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp3$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4722
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4723
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4724
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0x1);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4725
    __ vpaddd($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4726
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4727
    __ vpaddd($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4728
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4729
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4730
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4731
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4732
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4733
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4734
instruct rvadd2L_reduction_reg(rRegL dst, rRegL src1, vecX src2, regF tmp, regF tmp2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4735
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4736
  match(Set dst (AddReductionVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4737
  effect(TEMP tmp, TEMP tmp2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4738
  format %{ "pshufd  $tmp2,$src2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4739
            "vpaddq  $tmp,$src2,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4740
            "movdq   $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4741
            "vpaddq  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4742
            "movdq   $dst,$tmp2\t! add reduction2L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4743
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4744
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4745
    __ vpaddq($tmp$$XMMRegister, $src2$$XMMRegister, $tmp2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4746
    __ movdq($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4747
    __ vpaddq($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4748
    __ movdq($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4749
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4750
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4751
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4752
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4753
instruct rvadd4L_reduction_reg(rRegL dst, rRegL src1, vecY src2, regF tmp, regF tmp2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4754
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4755
  match(Set dst (AddReductionVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4756
  effect(TEMP tmp, TEMP tmp2);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4757
  format %{ "vextracti128_high  $tmp,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4758
            "vpaddq  $tmp2,$tmp,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4759
            "pshufd  $tmp,$tmp2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4760
            "vpaddq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4761
            "movdq   $tmp,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4762
            "vpaddq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4763
            "movdq   $dst,$tmp2\t! add reduction4L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4764
  ins_encode %{
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4765
    __ vextracti128_high($tmp$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4766
    __ vpaddq($tmp2$$XMMRegister, $tmp$$XMMRegister, $src2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4767
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4768
    __ vpaddq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4769
    __ movdq($tmp$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4770
    __ vpaddq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4771
    __ movdq($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4772
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4773
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4774
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4775
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4776
instruct rvadd8L_reduction_reg(rRegL dst, rRegL src1, vecZ src2, regF tmp, regF tmp2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4777
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4778
  match(Set dst (AddReductionVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4779
  effect(TEMP tmp, TEMP tmp2);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4780
  format %{ "vextracti64x4_high  $tmp2,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4781
            "vpaddq  $tmp2,$tmp2,$src2\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4782
            "vextracti128_high  $tmp,$tmp2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4783
            "vpaddq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4784
            "pshufd  $tmp,$tmp2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4785
            "vpaddq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4786
            "movdq   $tmp,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4787
            "vpaddq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4788
            "movdq   $dst,$tmp2\t! add reduction8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4789
  ins_encode %{
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4790
    __ vextracti64x4_high($tmp2$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4791
    __ vpaddq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $src2$$XMMRegister, 1);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4792
    __ vextracti128_high($tmp$$XMMRegister, $tmp2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4793
    __ vpaddq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4794
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4795
    __ vpaddq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4796
    __ movdq($tmp$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4797
    __ vpaddq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4798
    __ movdq($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4799
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4800
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4801
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4802
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4803
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4804
instruct rsadd2F_reduction_reg(regF dst, vecD src2, regF tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4805
  predicate(UseSSE >= 1 && UseAVX == 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4806
  match(Set dst (AddReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4807
  effect(TEMP dst, TEMP tmp);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4808
  format %{ "addss   $dst,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4809
            "pshufd  $tmp,$src2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4810
            "addss   $dst,$tmp\t! add reduction2F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4811
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4812
    __ addss($dst$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4813
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4814
    __ addss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4815
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4816
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4817
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4818
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4819
instruct rvadd2F_reduction_reg(regF dst, vecD src2, regF tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4820
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4821
  match(Set dst (AddReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4822
  effect(TEMP dst, TEMP tmp);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4823
  format %{ "vaddss  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4824
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4825
            "vaddss  $dst,$dst,$tmp\t! add reduction2F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4826
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4827
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4828
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4829
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4830
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4831
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4832
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4833
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4834
instruct rsadd4F_reduction_reg(regF dst, vecX src2, regF tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4835
  predicate(UseSSE >= 1 && UseAVX == 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4836
  match(Set dst (AddReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4837
  effect(TEMP dst, TEMP tmp);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4838
  format %{ "addss   $dst,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4839
            "pshufd  $tmp,$src2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4840
            "addss   $dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4841
            "pshufd  $tmp,$src2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4842
            "addss   $dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4843
            "pshufd  $tmp,$src2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4844
            "addss   $dst,$tmp\t! add reduction4F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4845
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4846
    __ addss($dst$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4847
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4848
    __ addss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4849
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4850
    __ addss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4851
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4852
    __ addss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4853
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4854
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4855
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4856
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4857
instruct rvadd4F_reduction_reg(regF dst, vecX src2, regF tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4858
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4859
  match(Set dst (AddReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4860
  effect(TEMP tmp, TEMP dst);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4861
  format %{ "vaddss  $dst,dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4862
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4863
            "vaddss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4864
            "pshufd  $tmp,$src2,0x02\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4865
            "vaddss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4866
            "pshufd  $tmp,$src2,0x03\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4867
            "vaddss  $dst,$dst,$tmp\t! add reduction4F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4868
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4869
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4870
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4871
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4872
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4873
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4874
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4875
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4876
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4877
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4878
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4879
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4880
instruct radd8F_reduction_reg(regF dst, vecY src2, regF tmp, regF tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4881
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4882
  match(Set dst (AddReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4883
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4884
  format %{ "vaddss  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4885
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4886
            "vaddss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4887
            "pshufd  $tmp,$src2,0x02\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4888
            "vaddss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4889
            "pshufd  $tmp,$src2,0x03\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4890
            "vaddss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4891
            "vextractf128_high  $tmp2,$src2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4892
            "vaddss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4893
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4894
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4895
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4896
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4897
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4898
            "vaddss  $dst,$dst,$tmp\t! add reduction8F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4899
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4900
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4901
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4902
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4903
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4904
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4905
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4906
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4907
    __ vextractf128_high($tmp2$$XMMRegister, $src2$$XMMRegister);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4908
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4909
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4910
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4911
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4912
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4913
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4914
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4915
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4916
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4917
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4918
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4919
instruct radd16F_reduction_reg(regF dst, vecZ src2, regF tmp, regF tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4920
  predicate(UseAVX > 2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4921
  match(Set dst (AddReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4922
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4923
  format %{ "vaddss  $dst,$dst,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4924
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4925
            "vaddss  $dst,$dst,$tmp\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4926
            "pshufd  $tmp,$src2,0x02\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4927
            "vaddss  $dst,$dst,$tmp\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4928
            "pshufd  $tmp,$src2,0x03\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4929
            "vaddss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4930
            "vextractf32x4  $tmp2,$src2,0x1\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4931
            "vaddss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4932
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4933
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4934
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4935
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4936
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4937
            "vaddss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4938
            "vextractf32x4  $tmp2,$src2,0x2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4939
            "vaddss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4940
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4941
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4942
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4943
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4944
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4945
            "vaddss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4946
            "vextractf32x4  $tmp2,$src2,0x3\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4947
            "vaddss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4948
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4949
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4950
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4951
            "vaddss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4952
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4953
            "vaddss  $dst,$dst,$tmp\t! add reduction16F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4954
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4955
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4956
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4957
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4958
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4959
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  4960
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4961
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4962
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4963
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4964
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4965
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4966
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4967
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4968
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4969
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4970
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4971
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4972
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4973
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4974
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4975
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4976
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4977
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  4978
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x3);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4979
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4980
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4981
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4982
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4983
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4984
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4985
    __ vaddss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4986
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4987
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4988
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4989
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4990
instruct rsadd2D_reduction_reg(regD dst, vecX src2, regD tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4991
  predicate(UseSSE >= 1 && UseAVX == 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4992
  match(Set dst (AddReductionVD dst src2));
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4993
  effect(TEMP tmp, TEMP dst);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4994
  format %{ "addsd   $dst,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4995
            "pshufd  $tmp,$src2,0xE\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4996
            "addsd   $dst,$tmp\t! add reduction2D" %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  4997
  ins_encode %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4998
    __ addsd($dst$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  4999
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5000
    __ addsd($dst$$XMMRegister, $tmp$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5001
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5002
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5003
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5004
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5005
instruct rvadd2D_reduction_reg(regD dst, vecX src2, regD tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5006
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5007
  match(Set dst (AddReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5008
  effect(TEMP tmp, TEMP dst);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5009
  format %{ "vaddsd  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5010
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5011
            "vaddsd  $dst,$dst,$tmp\t! add reduction2D" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5012
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5013
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5014
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5015
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5016
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5017
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5018
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5019
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5020
instruct rvadd4D_reduction_reg(regD dst, vecY src2, regD tmp, regD tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5021
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5022
  match(Set dst (AddReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5023
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5024
  format %{ "vaddsd  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5025
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5026
            "vaddsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5027
            "vextractf32x4  $tmp2,$src2,0x1\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5028
            "vaddsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5029
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5030
            "vaddsd  $dst,$dst,$tmp\t! add reduction4D" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5031
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5032
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5033
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5034
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5035
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5036
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5037
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5038
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5039
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5040
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5041
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5042
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5043
instruct rvadd8D_reduction_reg(regD dst, vecZ src2, regD tmp, regD tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5044
  predicate(UseAVX > 2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5045
  match(Set dst (AddReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5046
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5047
  format %{ "vaddsd  $dst,$dst,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5048
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5049
            "vaddsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5050
            "vextractf32x4  $tmp2,$src2,0x1\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5051
            "vaddsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5052
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5053
            "vaddsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5054
            "vextractf32x4  $tmp2,$src2,0x2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5055
            "vaddsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5056
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5057
            "vaddsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5058
            "vextractf32x4  $tmp2,$src2,0x3\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5059
            "vaddsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5060
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5061
            "vaddsd  $dst,$dst,$tmp\t! add reduction8D" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5062
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5063
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5064
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5065
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5066
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5067
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5068
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5069
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5070
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5071
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5072
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5073
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5074
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x3);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5075
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5076
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5077
    __ vaddsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5078
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5079
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5080
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5081
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5082
instruct rsmul2I_reduction_reg(rRegI dst, rRegI src1, vecD src2, regF tmp, regF tmp2) %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5083
  predicate(UseSSE > 3 && UseAVX == 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5084
  match(Set dst (MulReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5085
  effect(TEMP tmp, TEMP tmp2);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5086
  format %{ "pshufd  $tmp2,$src2,0x1\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5087
            "pmulld  $tmp2,$src2\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5088
            "movd    $tmp,$src1\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5089
            "pmulld  $tmp2,$tmp\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5090
            "movd    $dst,$tmp2\t! mul reduction2I" %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5091
  ins_encode %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5092
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5093
    __ pmulld($tmp2$$XMMRegister, $src2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5094
    __ movdl($tmp$$XMMRegister, $src1$$Register);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5095
    __ pmulld($tmp2$$XMMRegister, $tmp$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5096
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5097
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5098
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5099
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5100
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5101
instruct rvmul2I_reduction_reg(rRegI dst, rRegI src1, vecD src2, regF tmp, regF tmp2) %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5102
  predicate(UseAVX > 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5103
  match(Set dst (MulReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5104
  effect(TEMP tmp, TEMP tmp2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5105
  format %{ "pshufd   $tmp2,$src2,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5106
            "vpmulld  $tmp,$src2,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5107
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5108
            "vpmulld  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5109
            "movd     $dst,$tmp2\t! mul reduction2I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5110
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5111
    int vector_len = 0;
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5112
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5113
    __ vpmulld($tmp$$XMMRegister, $src2$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5114
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5115
    __ vpmulld($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5116
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5117
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5118
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5119
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5120
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5121
instruct rsmul4I_reduction_reg(rRegI dst, rRegI src1, vecX src2, regF tmp, regF tmp2) %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5122
  predicate(UseSSE > 3 && UseAVX == 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5123
  match(Set dst (MulReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5124
  effect(TEMP tmp, TEMP tmp2);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5125
  format %{ "pshufd  $tmp2,$src2,0xE\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5126
            "pmulld  $tmp2,$src2\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5127
            "pshufd  $tmp,$tmp2,0x1\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5128
            "pmulld  $tmp2,$tmp\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5129
            "movd    $tmp,$src1\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5130
            "pmulld  $tmp2,$tmp\n\t"
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5131
            "movd    $dst,$tmp2\t! mul reduction4I" %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5132
  ins_encode %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5133
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0xE);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5134
    __ pmulld($tmp2$$XMMRegister, $src2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5135
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x1);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5136
    __ pmulld($tmp2$$XMMRegister, $tmp$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5137
    __ movdl($tmp$$XMMRegister, $src1$$Register);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5138
    __ pmulld($tmp2$$XMMRegister, $tmp$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5139
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5140
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5141
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5142
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5143
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5144
instruct rvmul4I_reduction_reg(rRegI dst, rRegI src1, vecX src2, regF tmp, regF tmp2) %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5145
  predicate(UseAVX > 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5146
  match(Set dst (MulReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5147
  effect(TEMP tmp, TEMP tmp2);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5148
  format %{ "pshufd   $tmp2,$src2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5149
            "vpmulld  $tmp,$src2,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5150
            "pshufd   $tmp2,$tmp,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5151
            "vpmulld  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5152
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5153
            "vpmulld  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5154
            "movd     $dst,$tmp2\t! mul reduction4I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5155
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5156
    int vector_len = 0;
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5157
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0xE);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5158
    __ vpmulld($tmp$$XMMRegister, $src2$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5159
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0x1);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5160
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5161
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5162
    __ vpmulld($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5163
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5164
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5165
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5166
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5167
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5168
instruct rvmul8I_reduction_reg(rRegI dst, rRegI src1, vecY src2, regF tmp, regF tmp2) %{
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5169
  predicate(UseAVX > 0);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5170
  match(Set dst (MulReductionVI src1 src2));
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5171
  effect(TEMP tmp, TEMP tmp2);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5172
  format %{ "vextracti128_high  $tmp,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5173
            "vpmulld  $tmp,$tmp,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5174
            "pshufd   $tmp2,$tmp,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5175
            "vpmulld  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5176
            "pshufd   $tmp2,$tmp,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5177
            "vpmulld  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5178
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5179
            "vpmulld  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5180
            "movd     $dst,$tmp2\t! mul reduction8I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5181
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5182
    int vector_len = 0;
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5183
    __ vextracti128_high($tmp$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5184
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5185
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5186
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5187
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0x1);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5188
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5189
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5190
    __ vpmulld($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5191
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5192
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5193
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5194
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5195
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5196
instruct rvmul16I_reduction_reg(rRegI dst, rRegI src1, vecZ src2, regF tmp, regF tmp2, regF tmp3) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5197
  predicate(UseAVX > 2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5198
  match(Set dst (MulReductionVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5199
  effect(TEMP tmp, TEMP tmp2, TEMP tmp3);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5200
  format %{ "vextracti64x4_high  $tmp3,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5201
            "vpmulld  $tmp3,$tmp3,$src2\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5202
            "vextracti128_high  $tmp,$tmp3\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5203
            "vpmulld  $tmp,$tmp,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5204
            "pshufd   $tmp2,$tmp,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5205
            "vpmulld  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5206
            "pshufd   $tmp2,$tmp,0x1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5207
            "vpmulld  $tmp,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5208
            "movd     $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5209
            "vpmulld  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5210
            "movd     $dst,$tmp2\t! mul reduction16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5211
  ins_encode %{
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5212
    __ vextracti64x4_high($tmp3$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5213
    __ vpmulld($tmp3$$XMMRegister, $tmp3$$XMMRegister, $src2$$XMMRegister, 1);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5214
    __ vextracti128_high($tmp$$XMMRegister, $tmp3$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5215
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp3$$XMMRegister, 0);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5216
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0xE);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5217
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5218
    __ pshufd($tmp2$$XMMRegister, $tmp$$XMMRegister, 0x1);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5219
    __ vpmulld($tmp$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5220
    __ movdl($tmp2$$XMMRegister, $src1$$Register);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5221
    __ vpmulld($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5222
    __ movdl($dst$$Register, $tmp2$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5223
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5224
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5225
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5226
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5227
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5228
instruct rvmul2L_reduction_reg(rRegL dst, rRegL src1, vecX src2, regF tmp, regF tmp2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5229
  predicate(UseAVX > 2 && VM_Version::supports_avx512dq());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5230
  match(Set dst (MulReductionVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5231
  effect(TEMP tmp, TEMP tmp2);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5232
  format %{ "pshufd   $tmp2,$src2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5233
            "vpmullq  $tmp,$src2,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5234
            "movdq    $tmp2,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5235
            "vpmullq  $tmp2,$tmp,$tmp2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5236
            "movdq    $dst,$tmp2\t! mul reduction2L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5237
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5238
    __ pshufd($tmp2$$XMMRegister, $src2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5239
    __ vpmullq($tmp$$XMMRegister, $src2$$XMMRegister, $tmp2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5240
    __ movdq($tmp2$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5241
    __ vpmullq($tmp2$$XMMRegister, $tmp$$XMMRegister, $tmp2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5242
    __ movdq($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5243
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5244
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5245
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5246
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5247
instruct rvmul4L_reduction_reg(rRegL dst, rRegL src1, vecY src2, regF tmp, regF tmp2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5248
  predicate(UseAVX > 2 && VM_Version::supports_avx512dq());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5249
  match(Set dst (MulReductionVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5250
  effect(TEMP tmp, TEMP tmp2);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5251
  format %{ "vextracti128_high  $tmp,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5252
            "vpmullq  $tmp2,$tmp,$src2\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5253
            "pshufd   $tmp,$tmp2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5254
            "vpmullq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5255
            "movdq    $tmp,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5256
            "vpmullq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5257
            "movdq    $dst,$tmp2\t! mul reduction4L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5258
  ins_encode %{
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5259
    __ vextracti128_high($tmp$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5260
    __ vpmullq($tmp2$$XMMRegister, $tmp$$XMMRegister, $src2$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5261
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5262
    __ vpmullq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5263
    __ movdq($tmp$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5264
    __ vpmullq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5265
    __ movdq($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5266
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5267
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5268
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5269
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5270
instruct rvmul8L_reduction_reg(rRegL dst, rRegL src1, vecZ src2, regF tmp, regF tmp2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5271
  predicate(UseAVX > 2 && VM_Version::supports_avx512dq());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5272
  match(Set dst (MulReductionVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5273
  effect(TEMP tmp, TEMP tmp2);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5274
  format %{ "vextracti64x4_high  $tmp2,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5275
            "vpmullq  $tmp2,$tmp2,$src2\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5276
            "vextracti128_high  $tmp,$tmp2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5277
            "vpmullq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5278
            "pshufd   $tmp,$tmp2,0xE\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5279
            "vpmullq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5280
            "movdq    $tmp,$src1\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5281
            "vpmullq  $tmp2,$tmp2,$tmp\n\t"
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5282
            "movdq    $dst,$tmp2\t! mul reduction8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5283
  ins_encode %{
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5284
    __ vextracti64x4_high($tmp2$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5285
    __ vpmullq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $src2$$XMMRegister, 1);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5286
    __ vextracti128_high($tmp$$XMMRegister, $tmp2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5287
    __ vpmullq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5288
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5289
    __ vpmullq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5290
    __ movdq($tmp$$XMMRegister, $src1$$Register);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5291
    __ vpmullq($tmp2$$XMMRegister, $tmp2$$XMMRegister, $tmp$$XMMRegister, 0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5292
    __ movdq($dst$$Register, $tmp2$$XMMRegister);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5293
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5294
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5295
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5296
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5297
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5298
instruct rsmul2F_reduction(regF dst, vecD src2, regF tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5299
  predicate(UseSSE >= 1 && UseAVX == 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5300
  match(Set dst (MulReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5301
  effect(TEMP dst, TEMP tmp);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5302
  format %{ "mulss   $dst,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5303
            "pshufd  $tmp,$src2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5304
            "mulss   $dst,$tmp\t! mul reduction2F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5305
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5306
    __ mulss($dst$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5307
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5308
    __ mulss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5309
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5310
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5311
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5312
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5313
instruct rvmul2F_reduction_reg(regF dst, vecD src2, regF tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5314
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5315
  match(Set dst (MulReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5316
  effect(TEMP tmp, TEMP dst);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5317
  format %{ "vmulss  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5318
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5319
            "vmulss  $dst,$dst,$tmp\t! mul reduction2F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5320
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5321
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5322
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5323
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5324
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5325
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5326
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5327
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5328
instruct rsmul4F_reduction_reg(regF dst, vecX src2, regF tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5329
  predicate(UseSSE >= 1 && UseAVX == 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5330
  match(Set dst (MulReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5331
  effect(TEMP dst, TEMP tmp);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5332
  format %{ "mulss   $dst,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5333
            "pshufd  $tmp,$src2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5334
            "mulss   $dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5335
            "pshufd  $tmp,$src2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5336
            "mulss   $dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5337
            "pshufd  $tmp,$src2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5338
            "mulss   $dst,$tmp\t! mul reduction4F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5339
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5340
    __ mulss($dst$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5341
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5342
    __ mulss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5343
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5344
    __ mulss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5345
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5346
    __ mulss($dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5347
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5348
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5349
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5350
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5351
instruct rvmul4F_reduction_reg(regF dst, vecX src2, regF tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5352
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5353
  match(Set dst (MulReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5354
  effect(TEMP tmp, TEMP dst);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5355
  format %{ "vmulss  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5356
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5357
            "vmulss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5358
            "pshufd  $tmp,$src2,0x02\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5359
            "vmulss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5360
            "pshufd  $tmp,$src2,0x03\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5361
            "vmulss  $dst,$dst,$tmp\t! mul reduction4F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5362
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5363
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5364
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5365
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5366
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5367
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5368
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5369
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5370
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5371
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5372
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5373
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5374
instruct rvmul8F_reduction_reg(regF dst, vecY src2, regF tmp, regF tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5375
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5376
  match(Set dst (MulReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5377
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5378
  format %{ "vmulss  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5379
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5380
            "vmulss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5381
            "pshufd  $tmp,$src2,0x02\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5382
            "vmulss  $dst,$dst,$tmp\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5383
            "pshufd  $tmp,$src2,0x03\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5384
            "vmulss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5385
            "vextractf128_high  $tmp2,$src2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5386
            "vmulss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5387
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5388
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5389
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5390
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5391
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5392
            "vmulss  $dst,$dst,$tmp\t! mul reduction8F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5393
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5394
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5395
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5396
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5397
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5398
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5399
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5400
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5401
    __ vextractf128_high($tmp2$$XMMRegister, $src2$$XMMRegister);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5402
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5403
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5404
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5405
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5406
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5407
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5408
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5409
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5410
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5411
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5412
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5413
instruct rvmul16F_reduction_reg(regF dst, vecZ src2, regF tmp, regF tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5414
  predicate(UseAVX > 2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5415
  match(Set dst (MulReductionVF dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5416
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5417
  format %{ "vmulss  $dst,$dst,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5418
            "pshufd  $tmp,$src2,0x01\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5419
            "vmulss  $dst,$dst,$tmp\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5420
            "pshufd  $tmp,$src2,0x02\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5421
            "vmulss  $dst,$dst,$tmp\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5422
            "pshufd  $tmp,$src2,0x03\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5423
            "vmulss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5424
            "vextractf32x4  $tmp2,$src2,0x1\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5425
            "vmulss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5426
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5427
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5428
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5429
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5430
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5431
            "vmulss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5432
            "vextractf32x4  $tmp2,$src2,0x2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5433
            "vmulss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5434
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5435
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5436
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5437
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5438
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5439
            "vmulss  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5440
            "vextractf32x4  $tmp2,$src2,0x3\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5441
            "vmulss  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5442
            "pshufd  $tmp,$tmp2,0x01\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5443
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5444
            "pshufd  $tmp,$tmp2,0x02\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5445
            "vmulss  $dst,$dst,$tmp\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5446
            "pshufd  $tmp,$tmp2,0x03\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5447
            "vmulss  $dst,$dst,$tmp\t! mul reduction16F" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5448
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5449
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5450
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x01);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5451
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5452
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x02);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5453
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5454
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0x03);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5455
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5456
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5457
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5458
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5459
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5460
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5461
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5462
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5463
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5464
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5465
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5466
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5467
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5468
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5469
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5470
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5471
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5472
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x3);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5473
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5474
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x01);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5475
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5476
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x02);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5477
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5478
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0x03);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5479
    __ vmulss($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5480
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5481
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5482
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5483
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5484
instruct rsmul2D_reduction_reg(regD dst, vecX src2, regD tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5485
  predicate(UseSSE >= 1 && UseAVX == 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5486
  match(Set dst (MulReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5487
  effect(TEMP dst, TEMP tmp);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5488
  format %{ "mulsd   $dst,$src2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5489
            "pshufd  $tmp,$src2,0xE\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5490
            "mulsd   $dst,$tmp\t! mul reduction2D" %}
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5491
  ins_encode %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5492
    __ mulsd($dst$$XMMRegister, $src2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5493
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5494
    __ mulsd($dst$$XMMRegister, $tmp$$XMMRegister);
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5495
  %}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5496
  ins_pipe( pipe_slow );
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5497
%}
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5498
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5499
instruct rvmul2D_reduction_reg(regD dst, vecX src2, regD tmp) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5500
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5501
  match(Set dst (MulReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5502
  effect(TEMP tmp, TEMP dst);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5503
  format %{ "vmulsd  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5504
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5505
            "vmulsd  $dst,$dst,$tmp\t! mul reduction2D" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5506
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5507
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5508
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5509
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5510
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5511
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5512
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5513
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5514
instruct rvmul4D_reduction_reg(regD dst, vecY src2, regD tmp, regD tmp2) %{
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5515
  predicate(UseAVX > 0);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5516
  match(Set dst (MulReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5517
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5518
  format %{ "vmulsd  $dst,$dst,$src2\n\t"
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5519
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5520
            "vmulsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5521
            "vextractf128_high  $tmp2,$src2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5522
            "vmulsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5523
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5524
            "vmulsd  $dst,$dst,$tmp\t! mul reduction4D" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5525
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5526
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30211
442fbbb31f75 8074981: Integer/FP scalar reduction optimization
kvn
parents: 25715
diff changeset
  5527
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5528
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5529
    __ vextractf128_high($tmp2$$XMMRegister, $src2$$XMMRegister);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5530
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5531
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5532
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5533
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5534
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5535
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5536
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5537
instruct rvmul8D_reduction_reg(regD dst, vecZ src2, regD tmp, regD tmp2) %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5538
  predicate(UseAVX > 2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5539
  match(Set dst (MulReductionVD dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5540
  effect(TEMP tmp, TEMP dst, TEMP tmp2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5541
  format %{ "vmulsd  $dst,$dst,$src2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5542
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5543
            "vmulsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5544
            "vextractf32x4  $tmp2,$src2,0x1\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5545
            "vmulsd  $dst,$dst,$tmp2\n\t"
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5546
            "pshufd  $tmp,$src2,0xE\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5547
            "vmulsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5548
            "vextractf32x4  $tmp2,$src2,0x2\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5549
            "vmulsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5550
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5551
            "vmulsd  $dst,$dst,$tmp\n\t"
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5552
            "vextractf32x4  $tmp2,$src2,0x3\n\t"
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5553
            "vmulsd  $dst,$dst,$tmp2\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5554
            "pshufd  $tmp,$tmp2,0xE\n\t"
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5555
            "vmulsd  $dst,$dst,$tmp\t! mul reduction8D" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5556
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5557
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $src2$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5558
    __ pshufd($tmp$$XMMRegister, $src2$$XMMRegister, 0xE);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5559
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5560
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x1);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5561
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5562
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5563
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5564
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x2);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5565
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5566
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5567
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 35581
diff changeset
  5568
    __ vextractf32x4($tmp2$$XMMRegister, $src2$$XMMRegister, 0x3);
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5569
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp2$$XMMRegister);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5570
    __ pshufd($tmp$$XMMRegister, $tmp2$$XMMRegister, 0xE);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5571
    __ vmulsd($dst$$XMMRegister, $dst$$XMMRegister, $tmp$$XMMRegister);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5572
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5573
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5574
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5575
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5576
// ====================VECTOR ARITHMETIC=======================================
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5577
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5578
// --------------------------------- ADD --------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5579
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5580
// Bytes vector add
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5581
instruct vadd4B(vecS dst, vecS src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5582
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5583
  match(Set dst (AddVB dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5584
  format %{ "paddb   $dst,$src\t! add packed4B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5585
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5586
    __ paddb($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5587
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5588
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5589
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5590
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5591
instruct vadd4B_reg_avx(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5592
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5593
  match(Set dst (AddVB src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5594
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed4B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5595
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5596
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5597
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5598
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5599
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5600
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5601
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5602
instruct vadd4B_reg_evex(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5603
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5604
  match(Set dst (AddVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5605
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed4B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5606
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5607
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5608
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5609
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5610
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5611
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5612
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5613
instruct vadd4B_reg_evex_special(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5614
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5615
  match(Set dst (AddVB dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5616
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5617
  format %{ "vpaddb  $dst,$dst,$src2\t! add packed4B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5618
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5619
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5620
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5621
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5622
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5623
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5624
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5625
instruct vadd4B_mem_avx(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5626
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5627
  match(Set dst (AddVB src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5628
  format %{ "vpaddb  $dst,$src,$mem\t! add packed4B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5629
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5630
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5631
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5632
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5633
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5634
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5635
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5636
instruct vadd4B_mem_evex(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5637
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5638
  match(Set dst (AddVB src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5639
  format %{ "vpaddb  $dst,$src,$mem\t! add packed4B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5640
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5641
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5642
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5643
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5644
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5645
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5646
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5647
instruct vadd4B_mem_evex_special(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5648
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5649
  match(Set dst (AddVB dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5650
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5651
  format %{ "vpaddb  $dst,$src,$mem\t! add packed4B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5652
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5653
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5654
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5655
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5656
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5657
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5658
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5659
instruct vadd8B(vecD dst, vecD src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5660
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5661
  match(Set dst (AddVB dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5662
  format %{ "paddb   $dst,$src\t! add packed8B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5663
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5664
    __ paddb($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5665
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5666
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5667
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5668
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5669
instruct vadd8B_reg_avx(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5670
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5671
  match(Set dst (AddVB src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5672
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed8B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5673
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5674
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5675
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5676
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5677
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5678
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5679
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5680
instruct vadd8B_reg_evex(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5681
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5682
  match(Set dst (AddVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5683
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed8B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5684
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5685
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5686
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5687
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5688
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5689
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5690
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5691
instruct vadd8B_reg_evex_special(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5692
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5693
  match(Set dst (AddVB dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5694
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5695
  format %{ "vpaddb  $dst,$dst,$src2\t! add packed8B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5696
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5697
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5698
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5699
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5700
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5701
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5702
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5703
instruct vadd8B_mem_avx(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5704
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5705
  match(Set dst (AddVB src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5706
  format %{ "vpaddb  $dst,$src,$mem\t! add packed8B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5707
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5708
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5709
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5710
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5711
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5712
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5713
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5714
instruct vadd8B_mem_evex(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5715
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5716
  match(Set dst (AddVB src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5717
  format %{ "vpaddb  $dst,$src,$mem\t! add packed8B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5718
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5719
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5720
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5721
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5722
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5723
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5724
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5725
instruct vadd8B_mem_evex_special(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5726
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5727
  match(Set dst (AddVB dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5728
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5729
  format %{ "vpaddb  $dst,$src,$mem\t! add packed8B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5730
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5731
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5732
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5733
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5734
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5735
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5736
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5737
instruct vadd16B(vecX dst, vecX src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5738
  predicate(UseAVX == 0 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5739
  match(Set dst (AddVB dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5740
  format %{ "paddb   $dst,$src\t! add packed16B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5741
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5742
    __ paddb($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5743
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5744
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5745
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5746
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5747
instruct vadd16B_reg_avx(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5748
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5749
  match(Set dst (AddVB src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5750
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed16B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5751
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5752
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5753
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5754
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5755
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5756
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5757
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5758
instruct vadd16B_reg_evex(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5759
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5760
  match(Set dst (AddVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5761
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed16B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5762
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5763
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5764
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5765
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5766
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5767
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5768
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5769
instruct vadd16B_reg_evex_special(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5770
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5771
  match(Set dst (AddVB dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5772
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5773
  format %{ "vpaddb  $dst,$dst,$src2\t! add packed16B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5774
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5775
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5776
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5777
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5778
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5779
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5780
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5781
instruct vadd16B_mem_avx(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5782
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5783
  match(Set dst (AddVB src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5784
  format %{ "vpaddb  $dst,$src,$mem\t! add packed16B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5785
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5786
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5787
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5788
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5789
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5790
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5791
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5792
instruct vadd16B_mem_evex(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5793
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5794
  match(Set dst (AddVB src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5795
  format %{ "vpaddb  $dst,$src,$mem\t! add packed16B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5796
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5797
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5798
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5799
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5800
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5801
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5802
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5803
instruct vadd16B_mem_evex_special(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5804
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5805
  match(Set dst (AddVB dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5806
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5807
  format %{ "vpaddb  $dst,$src,$mem\t! add packed16B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5808
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5809
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5810
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5811
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5812
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5813
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5814
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5815
instruct vadd32B_reg_avx(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5816
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 32);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5817
  match(Set dst (AddVB src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5818
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed32B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5819
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5820
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5821
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5822
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5823
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5824
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5825
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5826
instruct vadd32B_reg_evex(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5827
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5828
  match(Set dst (AddVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5829
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed32B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5830
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5831
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5832
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5833
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5834
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5835
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5836
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5837
instruct vadd32B_reg_evex_special(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5838
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 32);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5839
  match(Set dst (AddVB dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5840
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5841
  format %{ "vpaddb  $dst,$dst,$src2\t! add packed32B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5842
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5843
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5844
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5845
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5846
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5847
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5848
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5849
instruct vadd32B_mem_avx(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5850
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 32);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5851
  match(Set dst (AddVB src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5852
  format %{ "vpaddb  $dst,$src,$mem\t! add packed32B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5853
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5854
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5855
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5856
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5857
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5858
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5859
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5860
instruct vadd32B_mem_evex(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5861
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5862
  match(Set dst (AddVB src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5863
  format %{ "vpaddb  $dst,$src,$mem\t! add packed32B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5864
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5865
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5866
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5867
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5868
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5869
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5870
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5871
instruct vadd32B_mem_evex_special(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5872
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5873
  match(Set dst (AddVB dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5874
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5875
  format %{ "vpaddb  $dst,$src,$mem\t! add packed32B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5876
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5877
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5878
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5879
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5880
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5881
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5882
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5883
instruct vadd64B_reg(vecZ dst, vecZ src1, vecZ src2) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5884
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 64);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5885
  match(Set dst (AddVB src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5886
  format %{ "vpaddb  $dst,$src1,$src2\t! add packed64B" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5887
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5888
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5889
    __ vpaddb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5890
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5891
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5892
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5893
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5894
instruct vadd64B_mem(vecZ dst, vecZ src, memory mem) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5895
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 64);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5896
  match(Set dst (AddVB src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5897
  format %{ "vpaddb  $dst,$src,$mem\t! add packed64B" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5898
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5899
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5900
    __ vpaddb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5901
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5902
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5903
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5904
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5905
// Shorts/Chars vector add
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5906
instruct vadd2S(vecS dst, vecS src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5907
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5908
  match(Set dst (AddVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5909
  format %{ "paddw   $dst,$src\t! add packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5910
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5911
    __ paddw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5912
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5913
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5914
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5915
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5916
instruct vadd2S_reg_avx(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5917
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5918
  match(Set dst (AddVS src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5919
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5920
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5921
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5922
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5923
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5924
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5925
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5926
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5927
instruct vadd2S_reg_evex(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5928
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5929
  match(Set dst (AddVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5930
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5931
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5932
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  5933
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5934
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5935
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5936
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5937
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5938
instruct vadd2S_reg_evex_special(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5939
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5940
  match(Set dst (AddVS dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5941
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5942
  format %{ "vpaddw  $dst,$dst,$src2\t! add packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5943
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5944
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5945
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5946
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5947
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5948
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5949
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5950
instruct vadd2S_mem_avx(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5951
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 2);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5952
  match(Set dst (AddVS src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5953
  format %{ "vpaddw  $dst,$src,$mem\t! add packed2S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5954
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5955
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5956
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5957
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5958
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5959
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  5960
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5961
instruct vadd2S_mem_evex(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5962
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5963
  match(Set dst (AddVS src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5964
  format %{ "vpaddw  $dst,$src,$mem\t! add packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5965
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5966
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5967
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5968
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5969
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5970
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5971
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5972
instruct vadd2S_mem_evex_special(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5973
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5974
  match(Set dst (AddVS dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5975
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5976
  format %{ "vpaddw  $dst,$src,$mem\t! add packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5977
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5978
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5979
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5980
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5981
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5982
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5983
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5984
instruct vadd4S(vecD dst, vecD src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5985
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5986
  match(Set dst (AddVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5987
  format %{ "paddw   $dst,$src\t! add packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5988
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5989
    __ paddw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5990
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5991
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5992
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  5993
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5994
instruct vadd4S_reg_avx(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5995
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5996
  match(Set dst (AddVS src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5997
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5998
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  5999
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6000
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6001
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6002
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6003
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6004
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6005
instruct vadd4S_reg_evex(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6006
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6007
  match(Set dst (AddVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6008
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6009
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6010
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6011
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6012
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6013
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6014
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6015
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6016
instruct vadd4S_reg_evex_special(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6017
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6018
  match(Set dst (AddVS dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6019
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6020
  format %{ "vpaddw  $dst,$dst,$src2\t! add packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6021
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6022
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6023
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6024
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6025
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6026
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6027
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6028
instruct vadd4S_mem_avx(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6029
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6030
  match(Set dst (AddVS src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6031
  format %{ "vpaddw  $dst,$src,$mem\t! add packed4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6032
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6033
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6034
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6035
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6036
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6037
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6038
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6039
instruct vadd4S_mem_evex(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6040
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6041
  match(Set dst (AddVS src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6042
  format %{ "vpaddw  $dst,$src,$mem\t! add packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6043
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6044
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6045
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6046
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6047
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6048
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6049
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6050
instruct vadd4S_mem_evex_special(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6051
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6052
  match(Set dst (AddVS dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6053
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6054
  format %{ "vpaddw  $dst,$src,$mem\t! add packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6055
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6056
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6057
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6058
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6059
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6060
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6061
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6062
instruct vadd8S(vecX dst, vecX src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6063
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6064
  match(Set dst (AddVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6065
  format %{ "paddw   $dst,$src\t! add packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6066
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6067
    __ paddw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6068
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6069
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6070
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6071
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6072
instruct vadd8S_reg_avx(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6073
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6074
  match(Set dst (AddVS src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6075
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6076
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6077
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6078
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6079
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6080
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6081
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6082
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6083
instruct vadd8S_reg_evex(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6084
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6085
  match(Set dst (AddVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6086
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6087
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6088
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6089
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6090
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6091
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6092
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6093
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6094
instruct vadd8S_reg_evex_special(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6095
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6096
  match(Set dst (AddVS dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6097
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6098
  format %{ "vpaddw  $dst,$dst,$src2\t! add packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6099
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6100
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6101
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6102
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6103
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6104
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6105
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6106
instruct vadd8S_mem_avx(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6107
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6108
  match(Set dst (AddVS src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6109
  format %{ "vpaddw  $dst,$src,$mem\t! add packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6110
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6111
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6112
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6113
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6114
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6115
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6116
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6117
instruct vadd8S_mem_evex(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6118
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6119
  match(Set dst (AddVS src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6120
  format %{ "vpaddw  $dst,$src,$mem\t! add packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6121
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6122
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6123
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6124
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6125
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6126
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6127
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6128
instruct vadd8S_mem_evex_special(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6129
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6130
  match(Set dst (AddVS dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6131
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6132
  format %{ "vpaddw  $dst,$src,$mem\t! add packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6133
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6134
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6135
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6136
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6137
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6138
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6139
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6140
instruct vadd16S_reg_avx(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6141
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6142
  match(Set dst (AddVS src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6143
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6144
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6145
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6146
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6147
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6148
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6149
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6150
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6151
instruct vadd16S_reg_evex(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6152
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6153
  match(Set dst (AddVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6154
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6155
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6156
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6157
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6158
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6159
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6160
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6161
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6162
instruct vadd16S_reg_evex_special(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6163
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6164
  match(Set dst (AddVS dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6165
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6166
  format %{ "vpaddw  $dst,$dst,$src2\t! add packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6167
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6168
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6169
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6170
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6171
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6172
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6173
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6174
instruct vadd16S_mem_avx(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6175
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6176
  match(Set dst (AddVS src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6177
  format %{ "vpaddw  $dst,$src,$mem\t! add packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6178
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6179
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6180
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6181
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6182
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6183
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6184
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6185
instruct vadd16S_mem_evex(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6186
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6187
  match(Set dst (AddVS src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6188
  format %{ "vpaddw  $dst,$src,$mem\t! add packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6189
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6190
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6191
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6192
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6193
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6194
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6195
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6196
instruct vadd16S_mem_evex_special(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6197
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6198
  match(Set dst (AddVS dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6199
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6200
  format %{ "vpaddw  $dst,$src,$mem\t! add packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6201
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6202
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6203
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6204
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6205
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6206
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6207
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6208
instruct vadd32S_reg(vecZ dst, vecZ src1, vecZ src2) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6209
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6210
  match(Set dst (AddVS src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6211
  format %{ "vpaddw  $dst,$src1,$src2\t! add packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6212
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6213
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6214
    __ vpaddw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6215
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6216
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6217
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6218
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6219
instruct vadd32S_mem(vecZ dst, vecZ src, memory mem) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6220
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6221
  match(Set dst (AddVS src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6222
  format %{ "vpaddw  $dst,$src,$mem\t! add packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6223
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6224
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6225
    __ vpaddw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6226
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6227
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6228
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6229
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6230
// Integers vector add
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6231
instruct vadd2I(vecD dst, vecD src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6232
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6233
  match(Set dst (AddVI dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6234
  format %{ "paddd   $dst,$src\t! add packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6235
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6236
    __ paddd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6237
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6238
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6239
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6240
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6241
instruct vadd2I_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6242
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6243
  match(Set dst (AddVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6244
  format %{ "vpaddd  $dst,$src1,$src2\t! add packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6245
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6246
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6247
    __ vpaddd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6248
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6249
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6250
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6251
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6252
instruct vadd2I_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6253
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6254
  match(Set dst (AddVI src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6255
  format %{ "vpaddd  $dst,$src,$mem\t! add packed2I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6256
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6257
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6258
    __ vpaddd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6259
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6260
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6261
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6262
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6263
instruct vadd4I(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6264
  predicate(n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6265
  match(Set dst (AddVI dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6266
  format %{ "paddd   $dst,$src\t! add packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6267
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6268
    __ paddd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6269
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6270
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6271
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6272
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6273
instruct vadd4I_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6274
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6275
  match(Set dst (AddVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6276
  format %{ "vpaddd  $dst,$src1,$src2\t! add packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6277
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6278
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6279
    __ vpaddd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6280
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6281
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6282
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6283
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6284
instruct vadd4I_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6285
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6286
  match(Set dst (AddVI src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6287
  format %{ "vpaddd  $dst,$src,$mem\t! add packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6288
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6289
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6290
    __ vpaddd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6291
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6292
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6293
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6294
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6295
instruct vadd8I_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6296
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6297
  match(Set dst (AddVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6298
  format %{ "vpaddd  $dst,$src1,$src2\t! add packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6299
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6300
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6301
    __ vpaddd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6302
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6303
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6304
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6305
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6306
instruct vadd8I_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6307
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6308
  match(Set dst (AddVI src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6309
  format %{ "vpaddd  $dst,$src,$mem\t! add packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6310
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6311
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6312
    __ vpaddd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6313
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6314
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6315
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6316
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6317
instruct vadd16I_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6318
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6319
  match(Set dst (AddVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6320
  format %{ "vpaddd  $dst,$src1,$src2\t! add packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6321
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6322
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6323
    __ vpaddd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6324
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6325
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6326
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6327
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6328
instruct vadd16I_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6329
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6330
  match(Set dst (AddVI src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6331
  format %{ "vpaddd  $dst,$src,$mem\t! add packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6332
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6333
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6334
    __ vpaddd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6335
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6336
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6337
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6338
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6339
// Longs vector add
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6340
instruct vadd2L(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6341
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6342
  match(Set dst (AddVL dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6343
  format %{ "paddq   $dst,$src\t! add packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6344
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6345
    __ paddq($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6346
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6347
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6348
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6349
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6350
instruct vadd2L_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6351
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6352
  match(Set dst (AddVL src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6353
  format %{ "vpaddq  $dst,$src1,$src2\t! add packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6354
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6355
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6356
    __ vpaddq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6357
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6358
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6359
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6360
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6361
instruct vadd2L_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6362
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6363
  match(Set dst (AddVL src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6364
  format %{ "vpaddq  $dst,$src,$mem\t! add packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6365
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6366
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6367
    __ vpaddq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6368
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6369
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6370
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6371
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6372
instruct vadd4L_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6373
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6374
  match(Set dst (AddVL src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6375
  format %{ "vpaddq  $dst,$src1,$src2\t! add packed4L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6376
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6377
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6378
    __ vpaddq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6379
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6380
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6381
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6382
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6383
instruct vadd4L_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6384
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6385
  match(Set dst (AddVL src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6386
  format %{ "vpaddq  $dst,$src,$mem\t! add packed4L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6387
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6388
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6389
    __ vpaddq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6390
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6391
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6392
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6393
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6394
instruct vadd8L_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6395
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6396
  match(Set dst (AddVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6397
  format %{ "vpaddq  $dst,$src1,$src2\t! add packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6398
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6399
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6400
    __ vpaddq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6401
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6402
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6403
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6404
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6405
instruct vadd8L_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6406
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6407
  match(Set dst (AddVL src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6408
  format %{ "vpaddq  $dst,$src,$mem\t! add packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6409
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6410
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6411
    __ vpaddq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6412
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6413
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6414
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6415
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6416
// Floats vector add
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6417
instruct vadd2F(vecD dst, vecD src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6418
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6419
  match(Set dst (AddVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6420
  format %{ "addps   $dst,$src\t! add packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6421
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6422
    __ addps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6423
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6424
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6425
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6426
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6427
instruct vadd2F_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6428
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6429
  match(Set dst (AddVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6430
  format %{ "vaddps  $dst,$src1,$src2\t! add packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6431
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6432
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6433
    __ vaddps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6434
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6435
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6436
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6437
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6438
instruct vadd2F_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6439
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6440
  match(Set dst (AddVF src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6441
  format %{ "vaddps  $dst,$src,$mem\t! add packed2F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6442
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6443
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6444
    __ vaddps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6445
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6446
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6447
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6448
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6449
instruct vadd4F(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6450
  predicate(n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6451
  match(Set dst (AddVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6452
  format %{ "addps   $dst,$src\t! add packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6453
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6454
    __ addps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6455
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6456
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6457
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6458
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6459
instruct vadd4F_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6460
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6461
  match(Set dst (AddVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6462
  format %{ "vaddps  $dst,$src1,$src2\t! add packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6463
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6464
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6465
    __ vaddps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6466
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6467
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6468
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6469
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6470
instruct vadd4F_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6471
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6472
  match(Set dst (AddVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6473
  format %{ "vaddps  $dst,$src,$mem\t! add packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6474
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6475
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6476
    __ vaddps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6477
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6478
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6479
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6480
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6481
instruct vadd8F_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6482
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6483
  match(Set dst (AddVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6484
  format %{ "vaddps  $dst,$src1,$src2\t! add packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6485
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6486
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6487
    __ vaddps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6488
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6489
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6490
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6491
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6492
instruct vadd8F_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6493
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6494
  match(Set dst (AddVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6495
  format %{ "vaddps  $dst,$src,$mem\t! add packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6496
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6497
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6498
    __ vaddps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6499
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6500
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6501
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6502
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6503
instruct vadd16F_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6504
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6505
  match(Set dst (AddVF src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6506
  format %{ "vaddps  $dst,$src1,$src2\t! add packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6507
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6508
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6509
    __ vaddps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6510
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6511
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6512
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6513
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6514
instruct vadd16F_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6515
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6516
  match(Set dst (AddVF src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6517
  format %{ "vaddps  $dst,$src,$mem\t! add packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6518
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6519
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6520
    __ vaddps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6521
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6522
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6523
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6524
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6525
// Doubles vector add
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6526
instruct vadd2D(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6527
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6528
  match(Set dst (AddVD dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6529
  format %{ "addpd   $dst,$src\t! add packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6530
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6531
    __ addpd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6532
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6533
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6534
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6535
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6536
instruct vadd2D_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6537
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6538
  match(Set dst (AddVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6539
  format %{ "vaddpd  $dst,$src1,$src2\t! add packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6540
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6541
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6542
    __ vaddpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6543
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6544
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6545
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6546
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6547
instruct vadd2D_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6548
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6549
  match(Set dst (AddVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6550
  format %{ "vaddpd  $dst,$src,$mem\t! add packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6551
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6552
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6553
    __ vaddpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6554
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6555
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6556
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6557
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6558
instruct vadd4D_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6559
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6560
  match(Set dst (AddVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6561
  format %{ "vaddpd  $dst,$src1,$src2\t! add packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6562
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6563
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6564
    __ vaddpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6565
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6566
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6567
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6568
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6569
instruct vadd4D_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6570
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6571
  match(Set dst (AddVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6572
  format %{ "vaddpd  $dst,$src,$mem\t! add packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6573
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6574
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6575
    __ vaddpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6576
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6577
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6578
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6579
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6580
instruct vadd8D_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6581
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6582
  match(Set dst (AddVD src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6583
  format %{ "vaddpd  $dst,$src1,$src2\t! add packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6584
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6585
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6586
    __ vaddpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6587
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6588
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6589
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6590
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6591
instruct vadd8D_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6592
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6593
  match(Set dst (AddVD src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6594
  format %{ "vaddpd  $dst,$src,$mem\t! add packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6595
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6596
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6597
    __ vaddpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6598
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6599
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6600
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6601
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6602
// --------------------------------- SUB --------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6603
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6604
// Bytes vector sub
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6605
instruct vsub4B(vecS dst, vecS src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6606
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6607
  match(Set dst (SubVB dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6608
  format %{ "psubb   $dst,$src\t! sub packed4B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6609
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6610
    __ psubb($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6611
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6612
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6613
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6614
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6615
instruct vsub4B_reg_avx(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6616
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6617
  match(Set dst (SubVB src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6618
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed4B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6619
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6620
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6621
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6622
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6623
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6624
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6625
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6626
instruct vsub4B_reg_evex(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6627
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6628
  match(Set dst (SubVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6629
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed4B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6630
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6631
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6632
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6633
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6634
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6635
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6636
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6637
instruct vsub4B_reg_exex_special(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6638
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6639
  match(Set dst (SubVB dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6640
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6641
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed4B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6642
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6643
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6644
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6645
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6646
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6647
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6648
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6649
instruct vsub4B_mem_avx(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6650
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6651
  match(Set dst (SubVB src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6652
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed4B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6653
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6654
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6655
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6656
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6657
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6658
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6659
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6660
instruct vsub4B_mem_evex(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6661
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6662
  match(Set dst (SubVB src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6663
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed4B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6664
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6665
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6666
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6667
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6668
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6669
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6670
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6671
instruct vsub4B_mem_evex_special(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6672
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6673
  match(Set dst (SubVB dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6674
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6675
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed4B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6676
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6677
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6678
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6679
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6680
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6681
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6682
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6683
instruct vsub8B(vecD dst, vecD src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6684
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6685
  match(Set dst (SubVB dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6686
  format %{ "psubb   $dst,$src\t! sub packed8B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6687
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6688
    __ psubb($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6689
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6690
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6691
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6692
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6693
instruct vsub8B_reg_avx(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6694
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6695
  match(Set dst (SubVB src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6696
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed8B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6697
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6698
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6699
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6700
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6701
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6702
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6703
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6704
instruct vsub8B_reg_evex(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6705
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6706
  match(Set dst (SubVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6707
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed8B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6708
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6709
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6710
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6711
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6712
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6713
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6714
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6715
instruct vsub8B_reg_evex_special(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6716
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6717
  match(Set dst (SubVB dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6718
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6719
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed8B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6720
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6721
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6722
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6723
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6724
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6725
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6726
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6727
instruct vsub8B_mem_avx(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6728
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6729
  match(Set dst (SubVB src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6730
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed8B" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6731
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6732
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6733
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6734
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6735
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6736
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6737
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6738
instruct vsub8B_mem_evex(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6739
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6740
  match(Set dst (SubVB src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6741
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed8B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6742
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6743
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6744
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6745
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6746
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6747
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6748
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6749
instruct vsub8B_mem_evex_special(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6750
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6751
  match(Set dst (SubVB dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6752
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6753
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed8B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6754
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6755
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6756
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6757
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6758
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6759
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6760
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6761
instruct vsub16B(vecX dst, vecX src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6762
  predicate(UseAVX == 0 && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6763
  match(Set dst (SubVB dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6764
  format %{ "psubb   $dst,$src\t! sub packed16B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6765
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6766
    __ psubb($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6767
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6768
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6769
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6770
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6771
instruct vsub16B_reg_avx(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6772
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6773
  match(Set dst (SubVB src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6774
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed16B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6775
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6776
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6777
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6778
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6779
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6780
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6781
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6782
instruct vsub16B_reg_evex(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6783
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6784
  match(Set dst (SubVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6785
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed16B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6786
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6787
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6788
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6789
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6790
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6791
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6792
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6793
instruct vsub16B_reg_evex_special(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6794
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6795
  match(Set dst (SubVB dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6796
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6797
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed16B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6798
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6799
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6800
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6801
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6802
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6803
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6804
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6805
instruct vsub16B_mem_avx(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6806
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6807
  match(Set dst (SubVB src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6808
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed16B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6809
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6810
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6811
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6812
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6813
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6814
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6815
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6816
instruct vsub16B_mem_evex(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6817
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6818
  match(Set dst (SubVB src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6819
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed16B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6820
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6821
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6822
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6823
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6824
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6825
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6826
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6827
instruct vsub16B_mem_evex_special(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6828
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6829
  match(Set dst (SubVB dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6830
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6831
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed16B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6832
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6833
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6834
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6835
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6836
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6837
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6838
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6839
instruct vsub32B_reg_avx(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6840
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 32);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6841
  match(Set dst (SubVB src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6842
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed32B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6843
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6844
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6845
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6846
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6847
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6848
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6849
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6850
instruct vsub32B_reg_evex(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6851
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6852
  match(Set dst (SubVB src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6853
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed32B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6854
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6855
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6856
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6857
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6858
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6859
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6860
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6861
instruct vsub32B_reg_evex_special(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6862
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 32);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6863
  match(Set dst (SubVB dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6864
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6865
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed32B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6866
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6867
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6868
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6869
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6870
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6871
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6872
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6873
instruct vsub32B_mem_avx(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6874
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 32);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6875
  match(Set dst (SubVB src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6876
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed32B" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6877
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6878
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6879
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6880
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6881
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6882
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6883
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6884
instruct vsub32B_mem_evex(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6885
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6886
  match(Set dst (SubVB src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6887
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed32B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6888
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6889
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6890
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6891
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6892
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6893
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6894
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6895
instruct vsub32B_mem_evex_special(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6896
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 32);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6897
  match(Set dst (SubVB dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6898
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6899
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed32B" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6900
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6901
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6902
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6903
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6904
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6905
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6906
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6907
instruct vsub64B_reg(vecZ dst, vecZ src1, vecZ src2) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6908
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 64);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6909
  match(Set dst (SubVB src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6910
  format %{ "vpsubb  $dst,$src1,$src2\t! sub packed64B" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6911
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6912
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6913
    __ vpsubb($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6914
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6915
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6916
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6917
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6918
instruct vsub64B_mem(vecZ dst, vecZ src, memory mem) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6919
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 64);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6920
  match(Set dst (SubVB src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6921
  format %{ "vpsubb  $dst,$src,$mem\t! sub packed64B" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6922
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6923
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6924
    __ vpsubb($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6925
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6926
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6927
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6928
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6929
// Shorts/Chars vector sub
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6930
instruct vsub2S(vecS dst, vecS src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6931
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6932
  match(Set dst (SubVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6933
  format %{ "psubw   $dst,$src\t! sub packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6934
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6935
    __ psubw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6936
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6937
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6938
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6939
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6940
instruct vsub2S_reg_avx(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6941
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6942
  match(Set dst (SubVS src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6943
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6944
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6945
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6946
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6947
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6948
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6949
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6950
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6951
instruct vsub2S_reg_evex(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6952
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6953
  match(Set dst (SubVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6954
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6955
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6956
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  6957
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6958
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6959
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6960
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  6961
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6962
instruct vsub2S_reg_evex_special(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6963
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6964
  match(Set dst (SubVS dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6965
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6966
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6967
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6968
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6969
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6970
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6971
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6972
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6973
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6974
instruct vsub2S_mem_avx(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6975
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 2);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6976
  match(Set dst (SubVS src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6977
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed2S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6978
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6979
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6980
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6981
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6982
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6983
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  6984
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6985
instruct vsub2S_mem_evex(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6986
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6987
  match(Set dst (SubVS src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6988
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6989
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6990
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6991
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6992
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6993
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6994
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6995
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6996
instruct vsub2S_mem_evex_special(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6997
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6998
  match(Set dst (SubVS dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  6999
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7000
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7001
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7002
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7003
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7004
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7005
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7006
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7007
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7008
instruct vsub4S(vecD dst, vecD src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7009
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7010
  match(Set dst (SubVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7011
  format %{ "psubw   $dst,$src\t! sub packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7012
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7013
    __ psubw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7014
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7015
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7016
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7017
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7018
instruct vsub4S_reg_avx(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7019
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7020
  match(Set dst (SubVS src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7021
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7022
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7023
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7024
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7025
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7026
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7027
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7028
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7029
instruct vsub4S_reg_evex(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7030
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7031
  match(Set dst (SubVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7032
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7033
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7034
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7035
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7036
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7037
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7038
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7039
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7040
instruct vsub4S_reg_evex_special(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7041
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7042
  match(Set dst (SubVS dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7043
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7044
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7045
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7046
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7047
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7048
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7049
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7050
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7051
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7052
instruct vsub4S_mem_avx(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7053
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7054
  match(Set dst (SubVS src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7055
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7056
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7057
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7058
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7059
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7060
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7061
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7062
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7063
instruct vsub4S_mem_evex(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7064
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7065
  match(Set dst (SubVS src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7066
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7067
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7068
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7069
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7070
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7071
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7072
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7073
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7074
instruct vsub4S_mem_evex_special(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7075
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7076
  match(Set dst (SubVS dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7077
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7078
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7079
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7080
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7081
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7082
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7083
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7084
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7085
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7086
instruct vsub8S(vecX dst, vecX src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7087
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7088
  match(Set dst (SubVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7089
  format %{ "psubw   $dst,$src\t! sub packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7090
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7091
    __ psubw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7092
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7093
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7094
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7095
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7096
instruct vsub8S_reg_avx(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7097
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7098
  match(Set dst (SubVS src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7099
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7100
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7101
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7102
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7103
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7104
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7105
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7106
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7107
instruct vsub8S_reg_evex(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7108
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7109
  match(Set dst (SubVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7110
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7111
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7112
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7113
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7114
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7115
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7116
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7117
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7118
instruct vsub8S_reg_evex_special(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7119
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7120
  match(Set dst (SubVS dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7121
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7122
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7123
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7124
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7125
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7126
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7127
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7128
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7129
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7130
instruct vsub8S_mem_avx(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7131
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7132
  match(Set dst (SubVS src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7133
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7134
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7135
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7136
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7137
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7138
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7139
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7140
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7141
instruct vsub8S_mem_evex(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7142
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7143
  match(Set dst (SubVS src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7144
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7145
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7146
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7147
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7148
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7149
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7150
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7151
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7152
instruct vsub8S_mem_evex_special(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7153
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7154
  match(Set dst (SubVS dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7155
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7156
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7157
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7158
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7159
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7160
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7161
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7162
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7163
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7164
instruct vsub16S_reg_avx(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7165
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7166
  match(Set dst (SubVS src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7167
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7168
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7169
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7170
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7171
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7172
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7173
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7174
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7175
instruct vsub16S_reg_evex(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7176
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7177
  match(Set dst (SubVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7178
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7179
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7180
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7181
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7182
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7183
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7184
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7185
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7186
instruct vsub16S_reg_evex_special(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7187
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7188
  match(Set dst (SubVS dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7189
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7190
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7191
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7192
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7193
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7194
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7195
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7196
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7197
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7198
instruct vsub16S_mem_avx(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7199
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7200
  match(Set dst (SubVS src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7201
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7202
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7203
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7204
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7205
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7206
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7207
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7208
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7209
instruct vsub16S_mem_evex(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7210
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7211
  match(Set dst (SubVS src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7212
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7213
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7214
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7215
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7216
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7217
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7218
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7219
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7220
instruct vsub16S_mem_evex_special(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7221
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7222
  match(Set dst (SubVS dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7223
   effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7224
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7225
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7226
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7227
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7228
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7229
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7230
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7231
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7232
instruct vsub32S_reg(vecZ dst, vecZ src1, vecZ src2) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7233
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7234
  match(Set dst (SubVS src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7235
  format %{ "vpsubw  $dst,$src1,$src2\t! sub packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7236
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7237
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7238
    __ vpsubw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7239
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7240
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7241
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7242
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7243
instruct vsub32S_mem(vecZ dst, vecZ src, memory mem) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7244
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7245
  match(Set dst (SubVS src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7246
  format %{ "vpsubw  $dst,$src,$mem\t! sub packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7247
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7248
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7249
    __ vpsubw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7250
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7251
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7252
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7253
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7254
// Integers vector sub
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7255
instruct vsub2I(vecD dst, vecD src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7256
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7257
  match(Set dst (SubVI dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7258
  format %{ "psubd   $dst,$src\t! sub packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7259
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7260
    __ psubd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7261
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7262
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7263
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7264
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7265
instruct vsub2I_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7266
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7267
  match(Set dst (SubVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7268
  format %{ "vpsubd  $dst,$src1,$src2\t! sub packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7269
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7270
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7271
    __ vpsubd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7272
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7273
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7274
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7275
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7276
instruct vsub2I_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7277
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7278
  match(Set dst (SubVI src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7279
  format %{ "vpsubd  $dst,$src,$mem\t! sub packed2I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7280
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7281
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7282
    __ vpsubd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7283
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7284
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7285
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7286
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7287
instruct vsub4I(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7288
  predicate(n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7289
  match(Set dst (SubVI dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7290
  format %{ "psubd   $dst,$src\t! sub packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7291
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7292
    __ psubd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7293
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7294
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7295
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7296
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7297
instruct vsub4I_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7298
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7299
  match(Set dst (SubVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7300
  format %{ "vpsubd  $dst,$src1,$src2\t! sub packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7301
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7302
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7303
    __ vpsubd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7304
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7305
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7306
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7307
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7308
instruct vsub4I_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7309
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7310
  match(Set dst (SubVI src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7311
  format %{ "vpsubd  $dst,$src,$mem\t! sub packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7312
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7313
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7314
    __ vpsubd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7315
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7316
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7317
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7318
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7319
instruct vsub8I_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7320
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7321
  match(Set dst (SubVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7322
  format %{ "vpsubd  $dst,$src1,$src2\t! sub packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7323
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7324
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7325
    __ vpsubd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7326
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7327
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7328
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7329
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7330
instruct vsub8I_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7331
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7332
  match(Set dst (SubVI src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7333
  format %{ "vpsubd  $dst,$src,$mem\t! sub packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7334
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7335
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7336
    __ vpsubd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7337
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7338
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7339
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7340
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7341
instruct vsub16I_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7342
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7343
  match(Set dst (SubVI src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7344
  format %{ "vpsubd  $dst,$src1,$src2\t! sub packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7345
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7346
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7347
    __ vpsubd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7348
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7349
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7350
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7351
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7352
instruct vsub16I_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7353
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7354
  match(Set dst (SubVI src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7355
  format %{ "vpsubd  $dst,$src,$mem\t! sub packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7356
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7357
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7358
    __ vpsubd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7359
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7360
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7361
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7362
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7363
// Longs vector sub
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7364
instruct vsub2L(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7365
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7366
  match(Set dst (SubVL dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7367
  format %{ "psubq   $dst,$src\t! sub packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7368
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7369
    __ psubq($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7370
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7371
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7372
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7373
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7374
instruct vsub2L_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7375
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7376
  match(Set dst (SubVL src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7377
  format %{ "vpsubq  $dst,$src1,$src2\t! sub packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7378
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7379
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7380
    __ vpsubq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7381
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7382
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7383
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7384
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7385
instruct vsub2L_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7386
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7387
  match(Set dst (SubVL src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7388
  format %{ "vpsubq  $dst,$src,$mem\t! sub packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7389
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7390
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7391
    __ vpsubq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7392
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7393
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7394
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7395
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7396
instruct vsub4L_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7397
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7398
  match(Set dst (SubVL src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7399
  format %{ "vpsubq  $dst,$src1,$src2\t! sub packed4L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7400
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7401
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7402
    __ vpsubq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7403
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7404
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7405
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7406
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7407
instruct vsub4L_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7408
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7409
  match(Set dst (SubVL src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7410
  format %{ "vpsubq  $dst,$src,$mem\t! sub packed4L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7411
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7412
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7413
    __ vpsubq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7414
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7415
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7416
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7417
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7418
instruct vsub8L_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7419
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7420
  match(Set dst (SubVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7421
  format %{ "vpsubq  $dst,$src1,$src2\t! sub packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7422
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7423
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7424
    __ vpsubq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7425
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7426
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7427
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7428
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7429
instruct vsub8L_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7430
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7431
  match(Set dst (SubVL src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7432
  format %{ "vpsubq  $dst,$src,$mem\t! sub packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7433
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7434
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7435
    __ vpsubq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7436
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7437
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7438
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7439
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7440
// Floats vector sub
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7441
instruct vsub2F(vecD dst, vecD src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7442
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7443
  match(Set dst (SubVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7444
  format %{ "subps   $dst,$src\t! sub packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7445
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7446
    __ subps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7447
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7448
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7449
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7450
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7451
instruct vsub2F_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7452
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7453
  match(Set dst (SubVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7454
  format %{ "vsubps  $dst,$src1,$src2\t! sub packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7455
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7456
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7457
    __ vsubps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7458
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7459
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7460
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7461
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7462
instruct vsub2F_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7463
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7464
  match(Set dst (SubVF src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7465
  format %{ "vsubps  $dst,$src,$mem\t! sub packed2F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7466
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7467
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7468
    __ vsubps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7469
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7470
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7471
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7472
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7473
instruct vsub4F(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7474
  predicate(n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7475
  match(Set dst (SubVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7476
  format %{ "subps   $dst,$src\t! sub packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7477
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7478
    __ subps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7479
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7480
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7481
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7482
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7483
instruct vsub4F_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7484
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7485
  match(Set dst (SubVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7486
  format %{ "vsubps  $dst,$src1,$src2\t! sub packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7487
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7488
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7489
    __ vsubps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7490
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7491
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7492
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7493
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7494
instruct vsub4F_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7495
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7496
  match(Set dst (SubVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7497
  format %{ "vsubps  $dst,$src,$mem\t! sub packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7498
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7499
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7500
    __ vsubps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7501
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7502
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7503
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7504
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7505
instruct vsub8F_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7506
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7507
  match(Set dst (SubVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7508
  format %{ "vsubps  $dst,$src1,$src2\t! sub packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7509
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7510
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7511
    __ vsubps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7512
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7513
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7514
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7515
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7516
instruct vsub8F_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7517
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7518
  match(Set dst (SubVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7519
  format %{ "vsubps  $dst,$src,$mem\t! sub packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7520
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7521
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7522
    __ vsubps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7523
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7524
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7525
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7526
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7527
instruct vsub16F_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7528
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7529
  match(Set dst (SubVF src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7530
  format %{ "vsubps  $dst,$src1,$src2\t! sub packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7531
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7532
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7533
    __ vsubps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7534
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7535
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7536
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7537
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7538
instruct vsub16F_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7539
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7540
  match(Set dst (SubVF src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7541
  format %{ "vsubps  $dst,$src,$mem\t! sub packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7542
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7543
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7544
    __ vsubps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7545
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7546
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7547
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7548
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7549
// Doubles vector sub
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7550
instruct vsub2D(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7551
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7552
  match(Set dst (SubVD dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7553
  format %{ "subpd   $dst,$src\t! sub packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7554
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7555
    __ subpd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7556
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7557
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7558
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7559
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7560
instruct vsub2D_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7561
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7562
  match(Set dst (SubVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7563
  format %{ "vsubpd  $dst,$src1,$src2\t! sub packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7564
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7565
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7566
    __ vsubpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7567
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7568
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7569
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7570
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7571
instruct vsub2D_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7572
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7573
  match(Set dst (SubVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7574
  format %{ "vsubpd  $dst,$src,$mem\t! sub packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7575
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7576
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7577
    __ vsubpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7578
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7579
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7580
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7581
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7582
instruct vsub4D_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7583
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7584
  match(Set dst (SubVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7585
  format %{ "vsubpd  $dst,$src1,$src2\t! sub packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7586
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7587
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7588
    __ vsubpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7589
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7590
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7591
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7592
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7593
instruct vsub4D_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7594
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7595
  match(Set dst (SubVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7596
  format %{ "vsubpd  $dst,$src,$mem\t! sub packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7597
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7598
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7599
    __ vsubpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7600
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7601
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7602
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7603
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7604
instruct vsub8D_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7605
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7606
  match(Set dst (SubVD src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7607
  format %{ "vsubpd  $dst,$src1,$src2\t! sub packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7608
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7609
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7610
    __ vsubpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7611
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7612
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7613
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7614
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7615
instruct vsub8D_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7616
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7617
  match(Set dst (SubVD src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7618
  format %{ "vsubpd  $dst,$src,$mem\t! sub packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7619
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7620
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7621
    __ vsubpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7622
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7623
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7624
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7625
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7626
// --------------------------------- MUL --------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7627
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7628
// Shorts/Chars vector mul
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7629
instruct vmul2S(vecS dst, vecS src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7630
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7631
  match(Set dst (MulVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7632
  format %{ "pmullw $dst,$src\t! mul packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7633
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7634
    __ pmullw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7635
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7636
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7637
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7638
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7639
instruct vmul2S_reg_avx(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7640
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7641
  match(Set dst (MulVS src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7642
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7643
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7644
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7645
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7646
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7647
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7648
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7649
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7650
instruct vmul2S_reg_evex(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7651
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7652
  match(Set dst (MulVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7653
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7654
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7655
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7656
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7657
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7658
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7659
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7660
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7661
instruct vmul2S_evex_special(vecS dst, vecS src1, vecS src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7662
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7663
  match(Set dst (MulVS dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7664
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7665
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7666
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7667
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7668
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7669
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7670
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7671
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7672
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7673
instruct vmul2S_mem_avx(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7674
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 2);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7675
  match(Set dst (MulVS src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7676
  format %{ "vpmullw $dst,$src,$mem\t! mul packed2S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7677
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7678
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7679
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7680
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7681
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7682
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7683
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7684
instruct vmul2S_mem_evex(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7685
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7686
  match(Set dst (MulVS src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7687
  format %{ "vpmullw $dst,$src,$mem\t! mul packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7688
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7689
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7690
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7691
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7692
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7693
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7694
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7695
instruct vmul2S_mem_evex_special(vecS dst, vecS src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7696
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7697
  match(Set dst (MulVS dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7698
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7699
  format %{ "vpmullw $dst,$src,$mem\t! mul packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7700
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7701
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7702
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7703
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7704
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7705
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7706
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7707
instruct vmul4S(vecD dst, vecD src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7708
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7709
  match(Set dst (MulVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7710
  format %{ "pmullw  $dst,$src\t! mul packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7711
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7712
    __ pmullw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7713
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7714
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7715
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7716
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7717
instruct vmul4S_reg_avx(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7718
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7719
  match(Set dst (MulVS src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7720
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7721
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7722
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7723
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7724
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7725
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7726
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7727
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7728
instruct vmul4S_reg_evex(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7729
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7730
  match(Set dst (MulVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7731
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7732
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7733
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7734
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7735
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7736
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7737
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7738
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7739
instruct vmul4S_reg_evex_special(vecD dst, vecD src1, vecD src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7740
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7741
  match(Set dst (MulVS dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7742
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7743
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7744
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7745
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7746
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7747
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7748
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7749
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7750
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7751
instruct vmul4S_mem_avx(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7752
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7753
  match(Set dst (MulVS src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7754
  format %{ "vpmullw $dst,$src,$mem\t! mul packed4S" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7755
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7756
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7757
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7758
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7759
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7760
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7761
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7762
instruct vmul4S_mem_evex(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7763
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7764
  match(Set dst (MulVS src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7765
  format %{ "vpmullw $dst,$src,$mem\t! mul packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7766
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7767
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7768
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7769
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7770
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7771
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7772
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7773
instruct vmul4S_mem_evex_special(vecD dst, vecD src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7774
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7775
  match(Set dst (MulVS dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7776
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7777
  format %{ "vpmullw $dst,$src,$mem\t! mul packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7778
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7779
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7780
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7781
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7782
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7783
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7784
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7785
instruct vmul8S(vecX dst, vecX src) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7786
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7787
  match(Set dst (MulVS dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7788
  format %{ "pmullw  $dst,$src\t! mul packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7789
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7790
    __ pmullw($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7791
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7792
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7793
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7794
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7795
instruct vmul8S_reg_avx(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7796
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7797
  match(Set dst (MulVS src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7798
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7799
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7800
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7801
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7802
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7803
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7804
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7805
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7806
instruct vmul8S_reg_evex(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7807
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7808
  match(Set dst (MulVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7809
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7810
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7811
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7812
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7813
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7814
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7815
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7816
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7817
instruct vmul8S_reg_evex_special(vecX dst, vecX src1, vecX src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7818
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7819
  match(Set dst (MulVS dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7820
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7821
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7822
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7823
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7824
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7825
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7826
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7827
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7828
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7829
instruct vmul8S_mem_avx(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7830
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7831
  match(Set dst (MulVS src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7832
  format %{ "vpmullw $dst,$src,$mem\t! mul packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7833
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7834
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7835
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7836
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7837
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7838
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7839
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7840
instruct vmul8S_mem_evex(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7841
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7842
  match(Set dst (MulVS src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7843
  format %{ "vpmullw $dst,$src,$mem\t! mul packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7844
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7845
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7846
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7847
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7848
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7849
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7850
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7851
instruct vmul8S_mem_evex_special(vecX dst, vecX src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7852
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7853
  match(Set dst (MulVS dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7854
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7855
  format %{ "vpmullw $dst,$src,$mem\t! mul packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7856
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7857
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7858
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7859
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7860
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7861
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7862
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7863
instruct vmul16S_reg_avx(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7864
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7865
  match(Set dst (MulVS src1 src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7866
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7867
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7868
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7869
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7870
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7871
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7872
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7873
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7874
instruct vmul16S_reg_evex(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7875
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7876
  match(Set dst (MulVS src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7877
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7878
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7879
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7880
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7881
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7882
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7883
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7884
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7885
instruct vmul16S_reg_evex_special(vecY dst, vecY src1, vecY src2) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7886
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7887
  match(Set dst (MulVS dst src2));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7888
  effect(TEMP src1);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7889
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7890
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7891
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7892
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7893
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7894
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7895
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7896
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7897
instruct vmul16S_mem_avx(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7898
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7899
  match(Set dst (MulVS src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7900
  format %{ "vpmullw $dst,$src,$mem\t! mul packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7901
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7902
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7903
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7904
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7905
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7906
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7907
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7908
instruct vmul16S_mem_evex(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7909
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7910
  match(Set dst (MulVS src (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7911
  format %{ "vpmullw $dst,$src,$mem\t! mul packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7912
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7913
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7914
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7915
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7916
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7917
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7918
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7919
instruct vmul16S_mem_evex_special(vecY dst, vecY src, memory mem) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7920
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7921
  match(Set dst (MulVS dst (LoadVector mem)));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7922
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7923
  format %{ "vpmullw $dst,$src,$mem\t! mul packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7924
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7925
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7926
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7927
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7928
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7929
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7930
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7931
instruct vmul32S_reg(vecZ dst, vecZ src1, vecZ src2) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7932
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7933
  match(Set dst (MulVS src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7934
  format %{ "vpmullw $dst,$src1,$src2\t! mul packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7935
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7936
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7937
    __ vpmullw($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7938
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7939
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7940
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7941
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7942
instruct vmul32S_mem(vecZ dst, vecZ src, memory mem) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  7943
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7944
  match(Set dst (MulVS src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7945
  format %{ "vpmullw $dst,$src,$mem\t! mul packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7946
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7947
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7948
    __ vpmullw($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7949
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7950
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7951
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7952
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7953
// Integers vector mul (sse4_1)
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7954
instruct vmul2I(vecD dst, vecD src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7955
  predicate(UseSSE > 3 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7956
  match(Set dst (MulVI dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7957
  format %{ "pmulld  $dst,$src\t! mul packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7958
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7959
    __ pmulld($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7960
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7961
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7962
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7963
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7964
instruct vmul2I_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7965
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7966
  match(Set dst (MulVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7967
  format %{ "vpmulld $dst,$src1,$src2\t! mul packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7968
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7969
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7970
    __ vpmulld($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7971
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7972
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7973
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  7974
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7975
instruct vmul2I_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7976
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7977
  match(Set dst (MulVI src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7978
  format %{ "vpmulld $dst,$src,$mem\t! mul packed2I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7979
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7980
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  7981
    __ vpmulld($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7982
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7983
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7984
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7985
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7986
instruct vmul4I(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7987
  predicate(UseSSE > 3 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7988
  match(Set dst (MulVI dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7989
  format %{ "pmulld  $dst,$src\t! mul packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7990
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7991
    __ pmulld($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7992
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7993
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7994
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7995
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7996
instruct vmul4I_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7997
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7998
  match(Set dst (MulVI src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  7999
  format %{ "vpmulld $dst,$src1,$src2\t! mul packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8000
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8001
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8002
    __ vpmulld($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8003
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8004
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8005
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8006
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8007
instruct vmul4I_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8008
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8009
  match(Set dst (MulVI src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8010
  format %{ "vpmulld $dst,$src,$mem\t! mul packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8011
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8012
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8013
    __ vpmulld($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8014
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8015
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8016
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8017
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8018
instruct vmul2L_reg(vecX dst, vecX src1, vecX src2) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8019
  predicate(UseAVX > 2 && n->as_Vector()->length() == 2 && VM_Version::supports_avx512dq());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8020
  match(Set dst (MulVL src1 src2));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8021
  format %{ "vpmullq $dst,$src1,$src2\t! mul packed2L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8022
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8023
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8024
    __ vpmullq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8025
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8026
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8027
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8028
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8029
instruct vmul2L_mem(vecX dst, vecX src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8030
  predicate(UseAVX > 2 && n->as_Vector()->length() == 2 && VM_Version::supports_avx512dq());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8031
  match(Set dst (MulVL src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8032
  format %{ "vpmullq $dst,$src,$mem\t! mul packed2L" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8033
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8034
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8035
    __ vpmullq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8036
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8037
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8038
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8039
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8040
instruct vmul4L_reg(vecY dst, vecY src1, vecY src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8041
  predicate(UseAVX > 2 && n->as_Vector()->length() == 4 && VM_Version::supports_avx512dq());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8042
  match(Set dst (MulVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8043
  format %{ "vpmullq $dst,$src1,$src2\t! mul packed4L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8044
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8045
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8046
    __ vpmullq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8047
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8048
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8049
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8050
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8051
instruct vmul4L_mem(vecY dst, vecY src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8052
  predicate(UseAVX > 2 && n->as_Vector()->length() == 4 && VM_Version::supports_avx512dq());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8053
  match(Set dst (MulVL src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8054
  format %{ "vpmullq $dst,$src,$mem\t! mul packed4L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8055
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8056
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8057
    __ vpmullq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8058
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8059
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8060
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8061
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8062
instruct vmul8L_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8063
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8 && VM_Version::supports_avx512dq());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8064
  match(Set dst (MulVL src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8065
  format %{ "vpmullq $dst,$src1,$src2\t! mul packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8066
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8067
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8068
    __ vpmullq($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8069
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8070
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8071
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8072
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8073
instruct vmul8L_mem(vecZ dst, vecZ src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8074
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8 && VM_Version::supports_avx512dq());
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8075
  match(Set dst (MulVL src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8076
  format %{ "vpmullq $dst,$src,$mem\t! mul packed8L" %}
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8077
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8078
    int vector_len = 2;
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8079
    __ vpmullq($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8080
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8081
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8082
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8083
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8084
instruct vmul8I_reg(vecY dst, vecY src1, vecY src2) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8085
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8086
  match(Set dst (MulVI src1 src2));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8087
  format %{ "vpmulld $dst,$src1,$src2\t! mul packed8I" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8088
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8089
    int vector_len = 1;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8090
    __ vpmulld($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8091
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8092
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8093
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8094
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8095
instruct vmul8I_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8096
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8097
  match(Set dst (MulVI src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8098
  format %{ "vpmulld $dst,$src,$mem\t! mul packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8099
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8100
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8101
    __ vpmulld($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8102
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8103
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8104
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8105
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8106
instruct vmul16I_reg(vecZ dst, vecZ src1, vecZ src2) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8107
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8108
  match(Set dst (MulVI src1 src2));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8109
  format %{ "vpmulld $dst,$src1,$src2\t! mul packed16I" %}
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8110
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8111
    int vector_len = 2;
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8112
    __ vpmulld($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8113
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8114
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8115
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8116
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8117
instruct vmul16I_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8118
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8119
  match(Set dst (MulVI src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8120
  format %{ "vpmulld $dst,$src,$mem\t! mul packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8121
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8122
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8123
    __ vpmulld($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8124
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8125
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8126
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8127
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8128
// Floats vector mul
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8129
instruct vmul2F(vecD dst, vecD src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8130
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8131
  match(Set dst (MulVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8132
  format %{ "mulps   $dst,$src\t! mul packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8133
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8134
    __ mulps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8135
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8136
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8137
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8138
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8139
instruct vmul2F_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8140
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8141
  match(Set dst (MulVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8142
  format %{ "vmulps  $dst,$src1,$src2\t! mul packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8143
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8144
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8145
    __ vmulps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8146
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8147
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8148
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8149
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8150
instruct vmul2F_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8151
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8152
  match(Set dst (MulVF src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8153
  format %{ "vmulps  $dst,$src,$mem\t! mul packed2F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8154
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8155
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8156
    __ vmulps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8157
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8158
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8159
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8160
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8161
instruct vmul4F(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8162
  predicate(n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8163
  match(Set dst (MulVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8164
  format %{ "mulps   $dst,$src\t! mul packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8165
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8166
    __ mulps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8167
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8168
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8169
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8170
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8171
instruct vmul4F_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8172
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8173
  match(Set dst (MulVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8174
  format %{ "vmulps  $dst,$src1,$src2\t! mul packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8175
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8176
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8177
    __ vmulps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8178
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8179
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8180
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8181
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8182
instruct vmul4F_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8183
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8184
  match(Set dst (MulVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8185
  format %{ "vmulps  $dst,$src,$mem\t! mul packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8186
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8187
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8188
    __ vmulps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8189
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8190
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8191
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8192
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8193
instruct vmul8F_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8194
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8195
  match(Set dst (MulVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8196
  format %{ "vmulps  $dst,$src1,$src2\t! mul packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8197
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8198
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8199
    __ vmulps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8200
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8201
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8202
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8203
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8204
instruct vmul8F_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8205
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8206
  match(Set dst (MulVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8207
  format %{ "vmulps  $dst,$src,$mem\t! mul packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8208
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8209
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8210
    __ vmulps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8211
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8212
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8213
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8214
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8215
instruct vmul16F_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8216
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8217
  match(Set dst (MulVF src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8218
  format %{ "vmulps  $dst,$src1,$src2\t! mul packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8219
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8220
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8221
    __ vmulps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8222
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8223
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8224
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8225
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8226
instruct vmul16F_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8227
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8228
  match(Set dst (MulVF src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8229
  format %{ "vmulps  $dst,$src,$mem\t! mul packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8230
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8231
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8232
    __ vmulps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8233
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8234
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8235
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8236
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8237
// Doubles vector mul
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8238
instruct vmul2D(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8239
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8240
  match(Set dst (MulVD dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8241
  format %{ "mulpd   $dst,$src\t! mul packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8242
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8243
    __ mulpd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8244
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8245
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8246
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8247
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8248
instruct vmul2D_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8249
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8250
  match(Set dst (MulVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8251
  format %{ "vmulpd  $dst,$src1,$src2\t! mul packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8252
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8253
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8254
    __ vmulpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8255
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8256
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8257
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8258
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8259
instruct vmul2D_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8260
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8261
  match(Set dst (MulVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8262
  format %{ "vmulpd  $dst,$src,$mem\t! mul packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8263
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8264
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8265
    __ vmulpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8266
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8267
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8268
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8269
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8270
instruct vmul4D_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8271
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8272
  match(Set dst (MulVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8273
  format %{ "vmulpd  $dst,$src1,$src2\t! mul packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8274
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8275
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8276
    __ vmulpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8277
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8278
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8279
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8280
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8281
instruct vmul4D_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8282
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8283
  match(Set dst (MulVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8284
  format %{ "vmulpd  $dst,$src,$mem\t! mul packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8285
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8286
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8287
    __ vmulpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8288
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8289
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8290
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8291
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8292
instruct vmul8D_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8293
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8294
  match(Set dst (MulVD src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8295
  format %{ "vmulpd  $dst k0,$src1,$src2\t! mul packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8296
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8297
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8298
    __ vmulpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8299
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8300
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8301
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8302
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8303
instruct vmul8D_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8304
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8305
  match(Set dst (MulVD src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8306
  format %{ "vmulpd  $dst k0,$src,$mem\t! mul packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8307
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8308
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8309
    __ vmulpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8310
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8311
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8312
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8313
48309
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8314
instruct vcmov8F_reg(vecY dst, vecY src1, vecY src2, immI8 cop, cmpOp_vcmppd copnd) %{
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8315
  predicate(UseAVX > 0 && UseAVX < 3 && n->as_Vector()->length() == 8);
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8316
  match(Set dst (CMoveVF (Binary copnd cop) (Binary src1 src2)));
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8317
  effect(TEMP dst, USE src1, USE src2);
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8318
  format %{ "cmpps.$copnd  $dst, $src1, $src2  ! vcmovevf, cond=$cop\n\t"
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8319
            "blendvps $dst,$src1,$src2,$dst ! vcmovevf\n\t"
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8320
         %}
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8321
  ins_encode %{
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8322
    int vector_len = 1;
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8323
    int cond = (Assembler::Condition)($copnd$$cmpcode);
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8324
    __ cmpps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, cond, vector_len);
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8325
    __ blendvps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, $dst$$XMMRegister, vector_len);
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8326
  %}
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8327
  ins_pipe( pipe_slow );
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8328
%}
1a0499fd252e 8192846: Support cmov vectorization for float
kvn
parents: 48089
diff changeset
  8329
33469
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8330
instruct vcmov4D_reg(vecY dst, vecY src1, vecY src2, immI8 cop, cmpOp_vcmppd copnd) %{
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8331
  predicate(UseAVX > 0 && UseAVX < 3 && n->as_Vector()->length() == 4);
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8332
  match(Set dst (CMoveVD (Binary copnd cop) (Binary src1 src2)));
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8333
  effect(TEMP dst, USE src1, USE src2);
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8334
  format %{ "cmppd.$copnd  $dst, $src1, $src2  ! vcmovevd, cond=$cop\n\t"
42039
db627462f2c9 8165381: Update for x86 SHA512 using AVX2
kvn
parents: 41333
diff changeset
  8335
            "blendvpd $dst,$src1,$src2,$dst ! vcmovevd\n\t"
33469
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8336
         %}
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8337
  ins_encode %{
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8338
    int vector_len = 1;
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8339
    int cond = (Assembler::Condition)($copnd$$cmpcode);
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8340
    __ cmppd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, cond, vector_len);
42039
db627462f2c9 8165381: Update for x86 SHA512 using AVX2
kvn
parents: 41333
diff changeset
  8341
    __ blendvpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, $dst$$XMMRegister, vector_len);
33469
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8342
  %}
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8343
  ins_pipe( pipe_slow );
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8344
%}
30f4811eded0 8139340: SuperWord enhancement to support vector conditional move (CMovVD) on Intel AVX cpu
iveresov
parents: 33065
diff changeset
  8345
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8346
// --------------------------------- DIV --------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8347
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8348
// Floats vector div
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8349
instruct vdiv2F(vecD dst, vecD src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8350
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8351
  match(Set dst (DivVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8352
  format %{ "divps   $dst,$src\t! div packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8353
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8354
    __ divps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8355
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8356
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8357
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8358
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8359
instruct vdiv2F_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8360
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8361
  match(Set dst (DivVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8362
  format %{ "vdivps  $dst,$src1,$src2\t! div packed2F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8363
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8364
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8365
    __ vdivps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8366
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8367
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8368
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8369
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8370
instruct vdiv2F_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8371
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8372
  match(Set dst (DivVF src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8373
  format %{ "vdivps  $dst,$src,$mem\t! div packed2F" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8374
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8375
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8376
    __ vdivps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8377
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8378
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8379
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
  8380
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8381
instruct vdiv4F(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8382
  predicate(n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8383
  match(Set dst (DivVF dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8384
  format %{ "divps   $dst,$src\t! div packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8385
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8386
    __ divps($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8387
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8388
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8389
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8390
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8391
instruct vdiv4F_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8392
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8393
  match(Set dst (DivVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8394
  format %{ "vdivps  $dst,$src1,$src2\t! div packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8395
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8396
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8397
    __ vdivps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8398
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8399
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8400
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8401
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8402
instruct vdiv4F_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8403
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8404
  match(Set dst (DivVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8405
  format %{ "vdivps  $dst,$src,$mem\t! div packed4F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8406
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8407
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8408
    __ vdivps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8409
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8410
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8411
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8412
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8413
instruct vdiv8F_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8414
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8415
  match(Set dst (DivVF src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8416
  format %{ "vdivps  $dst,$src1,$src2\t! div packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8417
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8418
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8419
    __ vdivps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8420
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8421
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8422
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8423
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8424
instruct vdiv8F_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8425
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8426
  match(Set dst (DivVF src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8427
  format %{ "vdivps  $dst,$src,$mem\t! div packed8F" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8428
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8429
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8430
    __ vdivps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8431
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8432
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8433
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8434
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8435
instruct vdiv16F_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8436
  predicate(UseAVX > 0 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8437
  match(Set dst (DivVF src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8438
  format %{ "vdivps  $dst,$src1,$src2\t! div packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8439
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8440
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8441
    __ vdivps($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8442
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8443
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8444
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8445
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8446
instruct vdiv16F_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8447
  predicate(UseAVX > 0 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8448
  match(Set dst (DivVF src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8449
  format %{ "vdivps  $dst,$src,$mem\t! div packed16F" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8450
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8451
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8452
    __ vdivps($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8453
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8454
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8455
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8456
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8457
// Doubles vector div
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8458
instruct vdiv2D(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8459
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8460
  match(Set dst (DivVD dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8461
  format %{ "divpd   $dst,$src\t! div packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8462
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8463
    __ divpd($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8464
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8465
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8466
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8467
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8468
instruct vdiv2D_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8469
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8470
  match(Set dst (DivVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8471
  format %{ "vdivpd  $dst,$src1,$src2\t! div packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8472
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8473
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8474
    __ vdivpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8475
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8476
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8477
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8478
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8479
instruct vdiv2D_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8480
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8481
  match(Set dst (DivVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8482
  format %{ "vdivpd  $dst,$src,$mem\t! div packed2D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8483
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8484
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8485
    __ vdivpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8486
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8487
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8488
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8489
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8490
instruct vdiv4D_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8491
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8492
  match(Set dst (DivVD src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8493
  format %{ "vdivpd  $dst,$src1,$src2\t! div packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8494
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8495
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8496
    __ vdivpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8497
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8498
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8499
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8500
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8501
instruct vdiv4D_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8502
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8503
  match(Set dst (DivVD src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8504
  format %{ "vdivpd  $dst,$src,$mem\t! div packed4D" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8505
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8506
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8507
    __ vdivpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8508
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8509
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8510
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8511
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8512
instruct vdiv8D_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8513
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8514
  match(Set dst (DivVD src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8515
  format %{ "vdivpd  $dst,$src1,$src2\t! div packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8516
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8517
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8518
    __ vdivpd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8519
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8520
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8521
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8522
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8523
instruct vdiv8D_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8524
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8525
  match(Set dst (DivVD src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8526
  format %{ "vdivpd  $dst,$src,$mem\t! div packed8D" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8527
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8528
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8529
    __ vdivpd($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8530
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8531
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8532
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8533
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8534
// ------------------------------ Shift ---------------------------------------
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8535
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8536
// Left and right shift count vectors are the same on x86
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8537
// (only lowest bits of xmm reg are used for count).
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8538
instruct vshiftcnt(vecS dst, rRegI cnt) %{
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8539
  match(Set dst (LShiftCntV cnt));
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8540
  match(Set dst (RShiftCntV cnt));
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8541
  format %{ "movd    $dst,$cnt\t! load shift count" %}
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8542
  ins_encode %{
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8543
    __ movdl($dst$$XMMRegister, $cnt$$Register);
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8544
  %}
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8545
  ins_pipe( pipe_slow );
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8546
%}
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8547
32723
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8548
// --------------------------------- Sqrt --------------------------------------
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8549
48089
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8550
// Floating point vector sqrt
32723
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8551
instruct vsqrt2D_reg(vecX dst, vecX src) %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8552
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8553
  match(Set dst (SqrtVD src));
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8554
  format %{ "vsqrtpd  $dst,$src\t! sqrt packed2D" %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8555
  ins_encode %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8556
    int vector_len = 0;
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8557
    __ vsqrtpd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8558
  %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8559
  ins_pipe( pipe_slow );
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8560
%}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8561
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8562
instruct vsqrt2D_mem(vecX dst, memory mem) %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8563
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8564
  match(Set dst (SqrtVD (LoadVector mem)));
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8565
  format %{ "vsqrtpd  $dst,$mem\t! sqrt packed2D" %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8566
  ins_encode %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8567
    int vector_len = 0;
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8568
    __ vsqrtpd($dst$$XMMRegister, $mem$$Address, vector_len);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8569
  %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8570
  ins_pipe( pipe_slow );
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8571
%}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8572
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8573
instruct vsqrt4D_reg(vecY dst, vecY src) %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8574
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8575
  match(Set dst (SqrtVD src));
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8576
  format %{ "vsqrtpd  $dst,$src\t! sqrt packed4D" %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8577
  ins_encode %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8578
    int vector_len = 1;
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8579
    __ vsqrtpd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8580
  %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8581
  ins_pipe( pipe_slow );
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8582
%}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8583
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8584
instruct vsqrt4D_mem(vecY dst, memory mem) %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8585
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8586
  match(Set dst (SqrtVD (LoadVector mem)));
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8587
  format %{ "vsqrtpd  $dst,$mem\t! sqrt packed4D" %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8588
  ins_encode %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8589
    int vector_len = 1;
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8590
    __ vsqrtpd($dst$$XMMRegister, $mem$$Address, vector_len);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8591
  %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8592
  ins_pipe( pipe_slow );
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8593
%}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8594
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8595
instruct vsqrt8D_reg(vecZ dst, vecZ src) %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8596
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8597
  match(Set dst (SqrtVD src));
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8598
  format %{ "vsqrtpd  $dst,$src\t! sqrt packed8D" %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8599
  ins_encode %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8600
    int vector_len = 2;
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8601
    __ vsqrtpd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8602
  %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8603
  ins_pipe( pipe_slow );
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8604
%}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8605
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8606
instruct vsqrt8D_mem(vecZ dst, memory mem) %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8607
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8608
  match(Set dst (SqrtVD (LoadVector mem)));
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8609
  format %{ "vsqrtpd  $dst,$mem\t! sqrt packed8D" %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8610
  ins_encode %{
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8611
    int vector_len = 2;
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8612
    __ vsqrtpd($dst$$XMMRegister, $mem$$Address, vector_len);
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8613
  %}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8614
  ins_pipe( pipe_slow );
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8615
%}
56534fb3d71a 8135028: support for vectorizing double precision sqrt
mcberg
parents: 32082
diff changeset
  8616
48089
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8617
instruct vsqrt2F_reg(vecD dst, vecD src) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8618
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8619
  match(Set dst (SqrtVF src));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8620
  format %{ "vsqrtps  $dst,$src\t! sqrt packed2F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8621
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8622
    int vector_len = 0;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8623
    __ vsqrtps($dst$$XMMRegister, $src$$XMMRegister, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8624
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8625
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8626
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8627
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8628
instruct vsqrt2F_mem(vecD dst, memory mem) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8629
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8630
  match(Set dst (SqrtVF (LoadVector mem)));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8631
  format %{ "vsqrtps  $dst,$mem\t! sqrt packed2F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8632
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8633
    int vector_len = 0;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8634
    __ vsqrtps($dst$$XMMRegister, $mem$$Address, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8635
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8636
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8637
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8638
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8639
instruct vsqrt4F_reg(vecX dst, vecX src) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8640
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8641
  match(Set dst (SqrtVF src));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8642
  format %{ "vsqrtps  $dst,$src\t! sqrt packed4F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8643
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8644
    int vector_len = 0;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8645
    __ vsqrtps($dst$$XMMRegister, $src$$XMMRegister, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8646
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8647
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8648
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8649
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8650
instruct vsqrt4F_mem(vecX dst, memory mem) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8651
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8652
  match(Set dst (SqrtVF (LoadVector mem)));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8653
  format %{ "vsqrtps  $dst,$mem\t! sqrt packed4F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8654
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8655
    int vector_len = 0;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8656
    __ vsqrtps($dst$$XMMRegister, $mem$$Address, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8657
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8658
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8659
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8660
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8661
instruct vsqrt8F_reg(vecY dst, vecY src) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8662
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8663
  match(Set dst (SqrtVF src));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8664
  format %{ "vsqrtps  $dst,$src\t! sqrt packed8F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8665
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8666
    int vector_len = 1;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8667
    __ vsqrtps($dst$$XMMRegister, $src$$XMMRegister, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8668
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8669
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8670
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8671
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8672
instruct vsqrt8F_mem(vecY dst, memory mem) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8673
  predicate(UseAVX > 0 && n->as_Vector()->length() == 8);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8674
  match(Set dst (SqrtVF (LoadVector mem)));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8675
  format %{ "vsqrtps  $dst,$mem\t! sqrt packed8F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8676
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8677
    int vector_len = 1;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8678
    __ vsqrtps($dst$$XMMRegister, $mem$$Address, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8679
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8680
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8681
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8682
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8683
instruct vsqrt16F_reg(vecZ dst, vecZ src) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8684
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8685
  match(Set dst (SqrtVF src));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8686
  format %{ "vsqrtps  $dst,$src\t! sqrt packed16F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8687
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8688
    int vector_len = 2;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8689
    __ vsqrtps($dst$$XMMRegister, $src$$XMMRegister, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8690
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8691
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8692
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8693
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8694
instruct vsqrt16F_mem(vecZ dst, memory mem) %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8695
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8696
  match(Set dst (SqrtVF (LoadVector mem)));
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8697
  format %{ "vsqrtps  $dst,$mem\t! sqrt packed16F" %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8698
  ins_encode %{
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8699
    int vector_len = 2;
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8700
    __ vsqrtps($dst$$XMMRegister, $mem$$Address, vector_len);
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8701
  %}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8702
  ins_pipe( pipe_slow );
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8703
%}
22c9856fc2c2 8190800: Support vectorization of Math.sqrt() on floats
rlupusoru
parents: 47216
diff changeset
  8704
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8705
// ------------------------------ LeftShift -----------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8706
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8707
// Shorts/Chars vector left shift
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8708
instruct vsll2S(vecS dst, vecS shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8709
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8710
  match(Set dst (LShiftVS dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8711
  format %{ "psllw   $dst,$shift\t! left shift packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8712
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8713
    __ psllw($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8714
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8715
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8716
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8717
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8718
instruct vsll2S_imm(vecS dst, immI8 shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8719
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8720
  match(Set dst (LShiftVS dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8721
  format %{ "psllw   $dst,$shift\t! left shift packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8722
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8723
    __ psllw($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8724
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8725
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8726
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8727
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8728
instruct vsll2S_reg_avx(vecS dst, vecS src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8729
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8730
  match(Set dst (LShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8731
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8732
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8733
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8734
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8735
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8736
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8737
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8738
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8739
instruct vsll2S_reg_evex(vecS dst, vecS src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8740
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8741
  match(Set dst (LShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8742
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8743
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8744
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8745
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8746
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8747
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8748
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8749
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8750
instruct vsll2S_reg_evex_special(vecS dst, vecS src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8751
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8752
  match(Set dst (LShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8753
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8754
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8755
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8756
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8757
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8758
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8759
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8760
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8761
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8762
instruct vsll2S_reg_imm_avx(vecS dst, vecS src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8763
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8764
  match(Set dst (LShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8765
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8766
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8767
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8768
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8769
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8770
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8771
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8772
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8773
instruct vsll2S_reg_imm_evex(vecS dst, vecS src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8774
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8775
  match(Set dst (LShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8776
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8777
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8778
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8779
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8780
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8781
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8782
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8783
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8784
instruct vsll2S_reg_imm_evex_special(vecS dst, vecS src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8785
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8786
  match(Set dst (LShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8787
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8788
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8789
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8790
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8791
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8792
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8793
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8794
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8795
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8796
instruct vsll4S(vecD dst, vecS shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8797
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8798
  match(Set dst (LShiftVS dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8799
  format %{ "psllw   $dst,$shift\t! left shift packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8800
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8801
    __ psllw($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8802
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8803
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8804
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8805
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8806
instruct vsll4S_imm(vecD dst, immI8 shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8807
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8808
  match(Set dst (LShiftVS dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8809
  format %{ "psllw   $dst,$shift\t! left shift packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8810
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8811
    __ psllw($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8812
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8813
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8814
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8815
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8816
instruct vsll4S_reg_avx(vecD dst, vecD src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8817
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8818
  match(Set dst (LShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8819
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8820
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8821
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8822
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8823
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8824
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8825
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8826
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8827
instruct vsll4S_reg_evex(vecD dst, vecD src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8828
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8829
  match(Set dst (LShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8830
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8831
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8832
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8833
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8834
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8835
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8836
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8837
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8838
instruct vsll4S_reg_evex_special(vecD dst, vecD src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8839
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8840
  match(Set dst (LShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8841
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8842
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8843
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8844
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8845
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8846
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8847
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8848
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8849
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8850
instruct vsll4S_reg_imm_avx(vecD dst, vecD src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8851
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8852
  match(Set dst (LShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8853
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8854
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8855
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8856
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8857
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8858
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8859
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8860
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8861
instruct vsll4S_reg_imm_evex(vecD dst, vecD src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8862
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8863
  match(Set dst (LShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8864
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8865
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8866
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8867
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8868
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8869
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8870
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8871
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8872
instruct vsll4S_reg_imm_evex_special(vecD dst, vecD src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8873
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8874
  match(Set dst (LShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8875
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8876
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8877
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8878
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8879
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8880
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8881
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8882
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8883
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  8884
instruct vsll8S(vecX dst, vecS shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8885
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8886
  match(Set dst (LShiftVS dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8887
  format %{ "psllw   $dst,$shift\t! left shift packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8888
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8889
    __ psllw($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8890
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8891
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8892
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8893
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8894
instruct vsll8S_imm(vecX dst, immI8 shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8895
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8896
  match(Set dst (LShiftVS dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8897
  format %{ "psllw   $dst,$shift\t! left shift packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8898
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8899
    __ psllw($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8900
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8901
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8902
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8903
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8904
instruct vsll8S_reg_avx(vecX dst, vecX src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8905
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8906
  match(Set dst (LShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8907
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8908
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8909
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8910
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8911
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8912
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8913
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8914
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8915
instruct vsll8S_reg_evex(vecX dst, vecX src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8916
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8917
  match(Set dst (LShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8918
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8919
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8920
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8921
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8922
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8923
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8924
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8925
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8926
instruct vsll8S_reg_evex_special(vecX dst, vecX src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8927
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8928
  match(Set dst (LShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8929
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8930
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8931
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8932
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8933
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8934
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8935
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8936
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8937
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8938
instruct vsll8S_reg_imm_avx(vecX dst, vecX src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8939
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8940
  match(Set dst (LShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8941
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8942
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8943
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8944
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8945
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8946
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8947
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8948
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8949
instruct vsll8S_reg_imm_evex(vecX dst, vecX src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8950
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8951
  match(Set dst (LShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8952
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8953
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8954
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8955
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8956
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8957
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8958
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8959
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8960
instruct vsll8S_reg_imm_evex_special(vecX dst, vecX src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8961
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8962
  match(Set dst (LShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8963
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8964
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8965
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8966
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8967
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8968
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8969
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8970
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8971
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8972
instruct vsll16S_reg_avx(vecY dst, vecY src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8973
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8974
  match(Set dst (LShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8975
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8976
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8977
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8978
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8979
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8980
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8981
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8982
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8983
instruct vsll16S_reg_evex(vecY dst, vecY src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8984
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8985
  match(Set dst (LShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8986
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8987
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8988
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  8989
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8990
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8991
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8992
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  8993
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8994
instruct vsll16S_reg_evex_special(vecY dst, vecY src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8995
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8996
  match(Set dst (LShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8997
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8998
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  8999
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9000
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9001
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9002
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9003
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9004
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9005
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9006
instruct vsll16S_reg_imm_avx(vecY dst, vecY src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9007
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9008
  match(Set dst (LShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9009
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9010
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9011
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9012
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9013
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9014
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9015
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9016
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9017
instruct vsll16S_reg_imm_evex(vecY dst, vecY src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9018
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9019
  match(Set dst (LShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9020
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9021
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9022
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9023
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9024
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9025
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9026
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9027
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9028
instruct vsll16S_reg_imm_evex_special(vecY dst, vecY src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9029
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9030
  match(Set dst (LShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9031
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9032
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9033
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9034
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9035
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9036
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9037
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9038
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9039
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9040
instruct vsll32S_reg(vecZ dst, vecZ src, vecS shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9041
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9042
  match(Set dst (LShiftVS src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9043
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9044
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9045
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9046
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9047
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9048
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9049
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9050
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9051
instruct vsll32S_reg_imm(vecZ dst, vecZ src, immI8 shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9052
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9053
  match(Set dst (LShiftVS src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9054
  format %{ "vpsllw  $dst,$src,$shift\t! left shift packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9055
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9056
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9057
    __ vpsllw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9058
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9059
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9060
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9061
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9062
// Integers vector left shift
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9063
instruct vsll2I(vecD dst, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9064
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9065
  match(Set dst (LShiftVI dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9066
  format %{ "pslld   $dst,$shift\t! left shift packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9067
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9068
    __ pslld($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9069
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9070
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9071
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9072
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9073
instruct vsll2I_imm(vecD dst, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9074
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9075
  match(Set dst (LShiftVI dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9076
  format %{ "pslld   $dst,$shift\t! left shift packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9077
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9078
    __ pslld($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9079
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9080
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9081
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9082
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9083
instruct vsll2I_reg(vecD dst, vecD src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9084
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9085
  match(Set dst (LShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9086
  format %{ "vpslld  $dst,$src,$shift\t! left shift packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9087
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9088
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9089
    __ vpslld($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9090
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9091
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9092
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9093
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9094
instruct vsll2I_reg_imm(vecD dst, vecD src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9095
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9096
  match(Set dst (LShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9097
  format %{ "vpslld  $dst,$src,$shift\t! left shift packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9098
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9099
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9100
    __ vpslld($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9101
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9102
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9103
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9104
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9105
instruct vsll4I(vecX dst, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9106
  predicate(n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9107
  match(Set dst (LShiftVI dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9108
  format %{ "pslld   $dst,$shift\t! left shift packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9109
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9110
    __ pslld($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9111
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9112
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9113
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9114
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9115
instruct vsll4I_imm(vecX dst, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9116
  predicate(n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9117
  match(Set dst (LShiftVI dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9118
  format %{ "pslld   $dst,$shift\t! left shift packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9119
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9120
    __ pslld($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9121
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9122
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9123
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9124
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9125
instruct vsll4I_reg(vecX dst, vecX src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9126
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9127
  match(Set dst (LShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9128
  format %{ "vpslld  $dst,$src,$shift\t! left shift packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9129
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9130
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9131
    __ vpslld($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9132
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9133
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9134
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9135
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9136
instruct vsll4I_reg_imm(vecX dst, vecX src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9137
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9138
  match(Set dst (LShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9139
  format %{ "vpslld  $dst,$src,$shift\t! left shift packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9140
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9141
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9142
    __ vpslld($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9143
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9144
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9145
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9146
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9147
instruct vsll8I_reg(vecY dst, vecY src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9148
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9149
  match(Set dst (LShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9150
  format %{ "vpslld  $dst,$src,$shift\t! left shift packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9151
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9152
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9153
    __ vpslld($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9154
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9155
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9156
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9157
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9158
instruct vsll8I_reg_imm(vecY dst, vecY src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9159
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9160
  match(Set dst (LShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9161
  format %{ "vpslld  $dst,$src,$shift\t! left shift packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9162
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9163
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9164
    __ vpslld($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9165
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9166
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9167
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9168
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9169
instruct vsll16I_reg(vecZ dst, vecZ src, vecS shift) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9170
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9171
  match(Set dst (LShiftVI src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9172
  format %{ "vpslld  $dst,$src,$shift\t! left shift packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9173
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9174
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9175
    __ vpslld($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9176
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9177
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9178
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9179
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9180
instruct vsll16I_reg_imm(vecZ dst, vecZ src, immI8 shift) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9181
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9182
  match(Set dst (LShiftVI src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9183
  format %{ "vpslld  $dst,$src,$shift\t! left shift packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9184
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9185
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9186
    __ vpslld($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9187
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9188
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9189
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9190
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9191
// Longs vector left shift
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9192
instruct vsll2L(vecX dst, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9193
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9194
  match(Set dst (LShiftVL dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9195
  format %{ "psllq   $dst,$shift\t! left shift packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9196
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9197
    __ psllq($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9198
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9199
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9200
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9201
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9202
instruct vsll2L_imm(vecX dst, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9203
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9204
  match(Set dst (LShiftVL dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9205
  format %{ "psllq   $dst,$shift\t! left shift packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9206
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9207
    __ psllq($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9208
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9209
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9210
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9211
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9212
instruct vsll2L_reg(vecX dst, vecX src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9213
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9214
  match(Set dst (LShiftVL src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9215
  format %{ "vpsllq  $dst,$src,$shift\t! left shift packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9216
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9217
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9218
    __ vpsllq($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9219
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9220
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9221
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9222
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9223
instruct vsll2L_reg_imm(vecX dst, vecX src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9224
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9225
  match(Set dst (LShiftVL src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9226
  format %{ "vpsllq  $dst,$src,$shift\t! left shift packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9227
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9228
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9229
    __ vpsllq($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9230
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9231
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9232
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9233
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9234
instruct vsll4L_reg(vecY dst, vecY src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9235
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9236
  match(Set dst (LShiftVL src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9237
  format %{ "vpsllq  $dst,$src,$shift\t! left shift packed4L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9238
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9239
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9240
    __ vpsllq($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9241
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9242
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9243
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9244
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9245
instruct vsll4L_reg_imm(vecY dst, vecY src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9246
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9247
  match(Set dst (LShiftVL src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9248
  format %{ "vpsllq  $dst,$src,$shift\t! left shift packed4L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9249
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9250
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9251
    __ vpsllq($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9252
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9253
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9254
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9255
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9256
instruct vsll8L_reg(vecZ dst, vecZ src, vecS shift) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9257
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9258
  match(Set dst (LShiftVL src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9259
  format %{ "vpsllq  $dst,$src,$shift\t! left shift packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9260
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9261
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9262
    __ vpsllq($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9263
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9264
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9265
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9266
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9267
instruct vsll8L_reg_imm(vecZ dst, vecZ src, immI8 shift) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9268
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9269
  match(Set dst (LShiftVL src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9270
  format %{ "vpsllq  $dst,$src,$shift\t! left shift packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9271
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9272
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9273
    __ vpsllq($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9274
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9275
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9276
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9277
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9278
// ----------------------- LogicalRightShift -----------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9279
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9280
// Shorts vector logical right shift produces incorrect Java result
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9281
// for negative data because java code convert short value into int with
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9282
// sign extension before a shift. But char vectors are fine since chars are
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9283
// unsigned values.
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9284
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9285
instruct vsrl2S(vecS dst, vecS shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9286
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9287
  match(Set dst (URShiftVS dst shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9288
  format %{ "psrlw   $dst,$shift\t! logical right shift packed2S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9289
  ins_encode %{
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9290
    __ psrlw($dst$$XMMRegister, $shift$$XMMRegister);
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9291
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9292
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9293
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9294
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9295
instruct vsrl2S_imm(vecS dst, immI8 shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9296
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9297
  match(Set dst (URShiftVS dst shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9298
  format %{ "psrlw   $dst,$shift\t! logical right shift packed2S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9299
  ins_encode %{
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9300
    __ psrlw($dst$$XMMRegister, (int)$shift$$constant);
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9301
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9302
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9303
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9304
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9305
instruct vsrl2S_reg_avx(vecS dst, vecS src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9306
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9307
  match(Set dst (URShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9308
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9309
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9310
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9311
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9312
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9313
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9314
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9315
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9316
instruct vsrl2S_reg_evex(vecS dst, vecS src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9317
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9318
  match(Set dst (URShiftVS src shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9319
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed2S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9320
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9321
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9322
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9323
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9324
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9325
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9326
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9327
instruct vsrl2S_reg_evex_special(vecS dst, vecS src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9328
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9329
  match(Set dst (URShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9330
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9331
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9332
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9333
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9334
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9335
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9336
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9337
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9338
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9339
instruct vsrl2S_reg_imm_avx(vecS dst, vecS src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9340
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 2);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9341
  match(Set dst (URShiftVS src shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9342
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed2S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9343
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9344
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9345
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9346
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9347
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9348
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9349
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9350
instruct vsrl2S_reg_imm_evex(vecS dst, vecS src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9351
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9352
  match(Set dst (URShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9353
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9354
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9355
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9356
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9357
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9358
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9359
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9360
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9361
instruct vsrl2S_reg_imm_evex_special(vecS dst, vecS src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9362
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9363
  match(Set dst (URShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9364
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9365
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9366
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9367
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9368
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9369
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9370
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9371
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9372
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9373
instruct vsrl4S(vecD dst, vecS shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9374
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9375
  match(Set dst (URShiftVS dst shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9376
  format %{ "psrlw   $dst,$shift\t! logical right shift packed4S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9377
  ins_encode %{
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9378
    __ psrlw($dst$$XMMRegister, $shift$$XMMRegister);
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9379
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9380
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9381
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9382
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9383
instruct vsrl4S_imm(vecD dst, immI8 shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9384
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9385
  match(Set dst (URShiftVS dst shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9386
  format %{ "psrlw   $dst,$shift\t! logical right shift packed4S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9387
  ins_encode %{
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9388
    __ psrlw($dst$$XMMRegister, (int)$shift$$constant);
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9389
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9390
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9391
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9392
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9393
instruct vsrl4S_reg_avx(vecD dst, vecD src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9394
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9395
  match(Set dst (URShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9396
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9397
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9398
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9399
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9400
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9401
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9402
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9403
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9404
instruct vsrl4S_reg_evex(vecD dst, vecD src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9405
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9406
  match(Set dst (URShiftVS src shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9407
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed4S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9408
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9409
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9410
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9411
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9412
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9413
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9414
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9415
instruct vsrl4S_reg_evex_special(vecD dst, vecD src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9416
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9417
  match(Set dst (URShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9418
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9419
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9420
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9421
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9422
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9423
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9424
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9425
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9426
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9427
instruct vsrl4S_reg_imm_avx(vecD dst, vecD src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9428
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9429
  match(Set dst (URShiftVS src shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9430
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed4S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9431
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9432
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9433
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9434
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9435
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9436
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9437
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9438
instruct vsrl4S_reg_imm_evex(vecD dst, vecD src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9439
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9440
  match(Set dst (URShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9441
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9442
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9443
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9444
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9445
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9446
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9447
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9448
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9449
instruct vsrl4S_reg_imm_evex_special(vecD dst, vecD src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9450
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9451
  match(Set dst (URShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9452
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9453
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9454
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9455
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9456
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9457
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9458
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9459
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9460
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9461
instruct vsrl8S(vecX dst, vecS shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9462
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9463
  match(Set dst (URShiftVS dst shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9464
  format %{ "psrlw   $dst,$shift\t! logical right shift packed8S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9465
  ins_encode %{
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9466
    __ psrlw($dst$$XMMRegister, $shift$$XMMRegister);
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9467
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9468
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9469
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9470
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9471
instruct vsrl8S_imm(vecX dst, immI8 shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9472
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9473
  match(Set dst (URShiftVS dst shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9474
  format %{ "psrlw   $dst,$shift\t! logical right shift packed8S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9475
  ins_encode %{
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9476
    __ psrlw($dst$$XMMRegister, (int)$shift$$constant);
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9477
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9478
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9479
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9480
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9481
instruct vsrl8S_reg_avx(vecX dst, vecX src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9482
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9483
  match(Set dst (URShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9484
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9485
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9486
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9487
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9488
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9489
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9490
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9491
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9492
instruct vsrl8S_reg_evex(vecX dst, vecX src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9493
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9494
  match(Set dst (URShiftVS src shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9495
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed8S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9496
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9497
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9498
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9499
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9500
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9501
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9502
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9503
instruct vsrl8S_reg_evex_special(vecX dst, vecX src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9504
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9505
  match(Set dst (URShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9506
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9507
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9508
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9509
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9510
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9511
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9512
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9513
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9514
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9515
instruct vsrl8S_reg_imm_avx(vecX dst, vecX src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9516
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9517
  match(Set dst (URShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9518
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9519
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9520
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9521
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9522
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9523
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9524
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9525
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9526
instruct vsrl8S_reg_imm_evex(vecX dst, vecX src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9527
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9528
  match(Set dst (URShiftVS src shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9529
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed8S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9530
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9531
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9532
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9533
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9534
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9535
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9536
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9537
instruct vsrl8S_reg_imm_evex_special(vecX dst, vecX src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9538
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9539
  match(Set dst (URShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9540
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9541
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9542
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9543
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9544
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9545
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9546
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9547
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9548
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9549
instruct vsrl16S_reg_avx(vecY dst, vecY src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9550
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9551
  match(Set dst (URShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9552
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9553
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9554
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9555
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9556
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9557
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9558
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9559
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9560
instruct vsrl16S_reg_evex(vecY dst, vecY src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9561
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9562
  match(Set dst (URShiftVS src shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9563
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed16S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9564
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9565
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9566
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9567
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9568
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9569
%}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9570
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9571
instruct vsrl16S_reg_evex_special(vecY dst, vecY src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9572
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9573
  match(Set dst (URShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9574
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9575
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9576
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9577
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9578
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9579
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9580
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9581
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9582
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9583
instruct vsrl16S_reg_imm_avx(vecY dst, vecY src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9584
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 16);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9585
  match(Set dst (URShiftVS src shift));
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9586
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed16S" %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9587
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9588
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9589
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9590
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9591
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9592
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9593
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9594
instruct vsrl16S_reg_imm_evex(vecY dst, vecY src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9595
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9596
  match(Set dst (URShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9597
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9598
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9599
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9600
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9601
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9602
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9603
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9604
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9605
instruct vsrl16S_reg_imm_evex_special(vecY dst, vecY src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9606
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9607
  match(Set dst (URShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9608
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9609
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9610
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9611
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9612
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9613
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9614
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9615
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9616
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9617
instruct vsrl32S_reg(vecZ dst, vecZ src, vecS shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9618
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9619
  match(Set dst (URShiftVS src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9620
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9621
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9622
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9623
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9624
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9625
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9626
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9627
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9628
instruct vsrl32S_reg_imm(vecZ dst, vecZ src, immI8 shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9629
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9630
  match(Set dst (URShiftVS src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9631
  format %{ "vpsrlw  $dst,$src,$shift\t! logical right shift packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9632
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9633
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9634
    __ vpsrlw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
14131
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9635
  %}
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9636
  ins_pipe( pipe_slow );
e376e3d428c9 8001183: incorrect results of char vectors right shift operaiton
kvn
parents: 13930
diff changeset
  9637
%}
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9638
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9639
// Integers vector logical right shift
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9640
instruct vsrl2I(vecD dst, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9641
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9642
  match(Set dst (URShiftVI dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9643
  format %{ "psrld   $dst,$shift\t! logical right shift packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9644
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9645
    __ psrld($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9646
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9647
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9648
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9649
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9650
instruct vsrl2I_imm(vecD dst, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9651
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9652
  match(Set dst (URShiftVI dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9653
  format %{ "psrld   $dst,$shift\t! logical right shift packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9654
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9655
    __ psrld($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9656
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9657
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9658
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9659
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9660
instruct vsrl2I_reg(vecD dst, vecD src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9661
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9662
  match(Set dst (URShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9663
  format %{ "vpsrld  $dst,$src,$shift\t! logical right shift packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9664
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9665
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9666
    __ vpsrld($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9667
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9668
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9669
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9670
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9671
instruct vsrl2I_reg_imm(vecD dst, vecD src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9672
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9673
  match(Set dst (URShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9674
  format %{ "vpsrld  $dst,$src,$shift\t! logical right shift packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9675
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9676
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9677
    __ vpsrld($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9678
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9679
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9680
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9681
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9682
instruct vsrl4I(vecX dst, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9683
  predicate(n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9684
  match(Set dst (URShiftVI dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9685
  format %{ "psrld   $dst,$shift\t! logical right shift packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9686
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9687
    __ psrld($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9688
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9689
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9690
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9691
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9692
instruct vsrl4I_imm(vecX dst, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9693
  predicate(n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9694
  match(Set dst (URShiftVI dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9695
  format %{ "psrld   $dst,$shift\t! logical right shift packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9696
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9697
    __ psrld($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9698
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9699
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9700
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9701
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9702
instruct vsrl4I_reg(vecX dst, vecX src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9703
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9704
  match(Set dst (URShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9705
  format %{ "vpsrld  $dst,$src,$shift\t! logical right shift packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9706
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9707
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9708
    __ vpsrld($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9709
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9710
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9711
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9712
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9713
instruct vsrl4I_reg_imm(vecX dst, vecX src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9714
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9715
  match(Set dst (URShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9716
  format %{ "vpsrld  $dst,$src,$shift\t! logical right shift packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9717
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9718
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9719
    __ vpsrld($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9720
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9721
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9722
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9723
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9724
instruct vsrl8I_reg(vecY dst, vecY src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9725
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9726
  match(Set dst (URShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9727
  format %{ "vpsrld  $dst,$src,$shift\t! logical right shift packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9728
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9729
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9730
    __ vpsrld($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9731
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9732
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9733
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9734
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9735
instruct vsrl8I_reg_imm(vecY dst, vecY src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9736
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9737
  match(Set dst (URShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9738
  format %{ "vpsrld  $dst,$src,$shift\t! logical right shift packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9739
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9740
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9741
    __ vpsrld($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9742
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9743
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9744
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9745
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9746
instruct vsrl16I_reg(vecZ dst, vecZ src, vecS shift) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9747
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9748
  match(Set dst (URShiftVI src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9749
  format %{ "vpsrld  $dst,$src,$shift\t! logical right shift packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9750
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9751
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9752
    __ vpsrld($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9753
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9754
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9755
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9756
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9757
instruct vsrl16I_reg_imm(vecZ dst, vecZ src, immI8 shift) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9758
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9759
  match(Set dst (URShiftVI src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9760
  format %{ "vpsrld  $dst,$src,$shift\t! logical right shift packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9761
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9762
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9763
    __ vpsrld($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9764
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9765
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9766
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9767
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9768
// Longs vector logical right shift
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9769
instruct vsrl2L(vecX dst, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9770
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9771
  match(Set dst (URShiftVL dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9772
  format %{ "psrlq   $dst,$shift\t! logical right shift packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9773
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9774
    __ psrlq($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9775
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9776
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9777
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9778
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9779
instruct vsrl2L_imm(vecX dst, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9780
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9781
  match(Set dst (URShiftVL dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9782
  format %{ "psrlq   $dst,$shift\t! logical right shift packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9783
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9784
    __ psrlq($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9785
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9786
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9787
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9788
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9789
instruct vsrl2L_reg(vecX dst, vecX src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9790
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9791
  match(Set dst (URShiftVL src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9792
  format %{ "vpsrlq  $dst,$src,$shift\t! logical right shift packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9793
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9794
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9795
    __ vpsrlq($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9796
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9797
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9798
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9799
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9800
instruct vsrl2L_reg_imm(vecX dst, vecX src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9801
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9802
  match(Set dst (URShiftVL src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9803
  format %{ "vpsrlq  $dst,$src,$shift\t! logical right shift packed2L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9804
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9805
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9806
    __ vpsrlq($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9807
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9808
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9809
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9810
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9811
instruct vsrl4L_reg(vecY dst, vecY src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9812
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9813
  match(Set dst (URShiftVL src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9814
  format %{ "vpsrlq  $dst,$src,$shift\t! logical right shift packed4L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9815
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9816
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9817
    __ vpsrlq($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9818
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9819
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9820
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9821
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9822
instruct vsrl4L_reg_imm(vecY dst, vecY src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9823
  predicate(UseAVX > 1 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9824
  match(Set dst (URShiftVL src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9825
  format %{ "vpsrlq  $dst,$src,$shift\t! logical right shift packed4L" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9826
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9827
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9828
    __ vpsrlq($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9829
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9830
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9831
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9832
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9833
instruct vsrl8L_reg(vecZ dst, vecZ src, vecS shift) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9834
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9835
  match(Set dst (URShiftVL src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9836
  format %{ "vpsrlq  $dst,$src,$shift\t! logical right shift packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9837
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9838
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9839
    __ vpsrlq($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9840
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9841
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9842
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9843
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9844
instruct vsrl8L_reg_imm(vecZ dst, vecZ src, immI8 shift) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9845
  predicate(UseAVX > 2 && n->as_Vector()->length() == 8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9846
  match(Set dst (URShiftVL src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9847
  format %{ "vpsrlq  $dst,$src,$shift\t! logical right shift packed8L" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9848
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9849
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9850
    __ vpsrlq($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9851
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9852
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9853
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9854
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9855
// ------------------- ArithmeticRightShift -----------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9856
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9857
// Shorts/Chars vector arithmetic right shift
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9858
instruct vsra2S(vecS dst, vecS shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9859
  predicate(UseAVX == 0 && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9860
  match(Set dst (RShiftVS dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9861
  format %{ "psraw   $dst,$shift\t! arithmetic right shift packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9862
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9863
    __ psraw($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9864
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9865
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9866
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9867
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9868
instruct vsra2S_imm(vecS dst, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9869
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9870
  match(Set dst (RShiftVS dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9871
  format %{ "psraw   $dst,$shift\t! arithmetic right shift packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9872
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9873
    __ psraw($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9874
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9875
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9876
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9877
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9878
instruct vsra2S_reg_avx(vecS dst, vecS src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9879
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9880
  match(Set dst (RShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9881
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9882
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9883
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9884
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9885
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9886
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9887
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9888
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9889
instruct vsra2S_reg_evex(vecS dst, vecS src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9890
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9891
  match(Set dst (RShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9892
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9893
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9894
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9895
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9896
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9897
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9898
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9899
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9900
instruct vsra2S_reg_evex_special(vecS dst, vecS src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9901
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9902
  match(Set dst (RShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9903
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9904
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9905
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9906
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9907
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9908
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9909
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9910
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9911
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9912
instruct vsra2S_reg_imm_avx(vecS dst, vecS src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9913
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 2);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9914
  match(Set dst (RShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9915
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed2S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9916
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9917
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9918
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9919
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9920
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9921
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9922
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9923
instruct vsra2S_reg_imm_evex(vecS dst, vecS src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9924
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9925
  match(Set dst (RShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9926
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9927
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9928
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9929
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9930
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9931
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9932
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9933
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9934
instruct vsra2S_reg_imm_evex_special(vecS dst, vecS src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9935
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 2);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9936
  match(Set dst (RShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9937
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9938
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed2S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9939
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9940
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9941
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9942
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9943
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9944
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9945
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
  9946
instruct vsra4S(vecD dst, vecS shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9947
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9948
  match(Set dst (RShiftVS dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9949
  format %{ "psraw   $dst,$shift\t! arithmetic right shift packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9950
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9951
    __ psraw($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9952
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9953
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9954
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9955
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9956
instruct vsra4S_imm(vecD dst, immI8 shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9957
  predicate(UseAVX == 0 && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9958
  match(Set dst (RShiftVS dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9959
  format %{ "psraw   $dst,$shift\t! arithmetic right shift packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9960
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9961
    __ psraw($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9962
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9963
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9964
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9965
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9966
instruct vsra4S_reg_avx(vecD dst, vecD src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9967
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9968
  match(Set dst (RShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9969
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9970
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9971
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9972
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9973
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9974
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9975
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9976
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9977
instruct vsra4S_reg_evex(vecD dst, vecD src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9978
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9979
  match(Set dst (RShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9980
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9981
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9982
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
  9983
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9984
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9985
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9986
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
  9987
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9988
instruct vsra4S_reg_evex_special(vecD dst, vecD src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9989
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9990
  match(Set dst (RShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9991
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9992
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9993
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9994
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9995
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9996
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9997
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9998
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
  9999
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10000
instruct vsra4S_reg_imm_avx(vecD dst, vecD src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10001
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 4);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10002
  match(Set dst (RShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10003
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed4S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10004
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10005
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10006
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10007
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10008
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10009
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10010
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10011
instruct vsra4S_reg_imm_evex(vecD dst, vecD src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10012
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10013
  match(Set dst (RShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10014
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10015
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10016
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10017
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10018
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10019
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10020
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10021
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10022
instruct vsra4S_reg_imm_evex_special(vecD dst, vecD src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10023
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 4);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10024
  match(Set dst (RShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10025
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10026
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed4S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10027
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10028
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10029
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10030
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10031
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10032
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10033
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
 10034
instruct vsra8S(vecX dst, vecS shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10035
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10036
  match(Set dst (RShiftVS dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10037
  format %{ "psraw   $dst,$shift\t! arithmetic right shift packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10038
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10039
    __ psraw($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10040
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10041
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10042
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10043
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10044
instruct vsra8S_imm(vecX dst, immI8 shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10045
  predicate(UseAVX == 0 && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10046
  match(Set dst (RShiftVS dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10047
  format %{ "psraw   $dst,$shift\t! arithmetic right shift packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10048
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10049
    __ psraw($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10050
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10051
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10052
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10053
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10054
instruct vsra8S_reg_avx(vecX dst, vecX src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10055
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10056
  match(Set dst (RShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10057
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10058
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10059
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10060
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10061
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10062
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10063
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10064
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10065
instruct vsra8S_reg_evex(vecX dst, vecX src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10066
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10067
  match(Set dst (RShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10068
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10069
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10070
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10071
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10072
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10073
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10074
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10075
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10076
instruct vsra8S_reg_evex_special(vecX dst, vecX src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10077
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10078
  match(Set dst (RShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10079
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10080
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10081
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10082
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10083
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10084
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10085
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10086
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10087
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10088
instruct vsra8S_reg_imm_avx(vecX dst, vecX src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10089
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10090
  match(Set dst (RShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10091
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10092
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10093
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10094
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10095
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10096
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10097
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10098
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10099
instruct vsra8S_reg_imm_evex(vecX dst, vecX src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10100
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 8);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10101
  match(Set dst (RShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10102
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed8S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10103
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10104
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10105
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10106
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10107
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10108
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10109
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10110
instruct vsra8S_reg_imm_evex_special(vecX dst, vecX src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10111
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 8);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10112
  match(Set dst (RShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10113
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10114
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed8S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10115
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10116
    int vector_len = 0;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10117
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10118
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10119
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10120
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10121
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10122
instruct vsra16S_reg_avx(vecY dst, vecY src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10123
  predicate(VM_Version::supports_avx256only() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10124
  match(Set dst (RShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10125
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10126
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10127
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10128
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10129
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10130
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10131
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10132
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10133
instruct vsra16S_reg_evex(vecY dst, vecY src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10134
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10135
  match(Set dst (RShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10136
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10137
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10138
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10139
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10140
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10141
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10142
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10143
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10144
instruct vsra16S_reg_evex_special(vecY dst, vecY src, vecS shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10145
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10146
  match(Set dst (RShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10147
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10148
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10149
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10150
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10151
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10152
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10153
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10154
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10155
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10156
instruct vsra16S_reg_imm_avx(vecY dst, vecY src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10157
  predicate(VM_Version::supports_avxonly() && n->as_Vector()->length() == 16);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10158
  match(Set dst (RShiftVS src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10159
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed16S" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10160
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10161
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10162
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10163
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10164
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10165
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10166
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10167
instruct vsra16S_reg_imm_evex(vecY dst, vecY src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10168
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10169
  match(Set dst (RShiftVS src shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10170
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10171
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10172
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10173
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10174
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10175
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10176
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10177
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10178
instruct vsra16S_reg_imm_evex_special(vecY dst, vecY src, immI8 shift) %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10179
  predicate(VM_Version::supports_avx512nobw() && n->as_Vector()->length() == 16);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10180
  match(Set dst (RShiftVS dst shift));
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10181
  effect(TEMP src);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10182
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed16S" %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10183
  ins_encode %{
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10184
    int vector_len = 1;
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10185
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10186
  %}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10187
  ins_pipe( pipe_slow );
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10188
%}
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10189
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10190
instruct vsra32S_reg(vecZ dst, vecZ src, vecS shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10191
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10192
  match(Set dst (RShiftVS src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10193
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10194
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10195
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10196
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10197
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10198
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10199
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10200
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10201
instruct vsra32S_reg_imm(vecZ dst, vecZ src, immI8 shift) %{
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33469
diff changeset
 10202
  predicate(VM_Version::supports_avx512bw() && n->as_Vector()->length() == 32);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10203
  match(Set dst (RShiftVS src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10204
  format %{ "vpsraw  $dst,$src,$shift\t! arithmetic right shift packed32S" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10205
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10206
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10207
    __ vpsraw($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10208
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10209
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10210
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10211
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10212
// Integers vector arithmetic right shift
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
 10213
instruct vsra2I(vecD dst, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10214
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10215
  match(Set dst (RShiftVI dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10216
  format %{ "psrad   $dst,$shift\t! arithmetic right shift packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10217
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10218
    __ psrad($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10219
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10220
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10221
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10222
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10223
instruct vsra2I_imm(vecD dst, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10224
  predicate(n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10225
  match(Set dst (RShiftVI dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10226
  format %{ "psrad   $dst,$shift\t! arithmetic right shift packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10227
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10228
    __ psrad($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10229
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10230
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10231
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10232
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
 10233
instruct vsra2I_reg(vecD dst, vecD src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10234
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10235
  match(Set dst (RShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10236
  format %{ "vpsrad  $dst,$src,$shift\t! arithmetic right shift packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10237
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10238
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10239
    __ vpsrad($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10240
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10241
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10242
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10243
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10244
instruct vsra2I_reg_imm(vecD dst, vecD src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10245
  predicate(UseAVX > 0 && n->as_Vector()->length() == 2);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10246
  match(Set dst (RShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10247
  format %{ "vpsrad  $dst,$src,$shift\t! arithmetic right shift packed2I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10248
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10249
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10250
    __ vpsrad($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10251
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10252
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10253
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10254
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
 10255
instruct vsra4I(vecX dst, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10256
  predicate(n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10257
  match(Set dst (RShiftVI dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10258
  format %{ "psrad   $dst,$shift\t! arithmetic right shift packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10259
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10260
    __ psrad($dst$$XMMRegister, $shift$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10261
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10262
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10263
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10264
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10265
instruct vsra4I_imm(vecX dst, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10266
  predicate(n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10267
  match(Set dst (RShiftVI dst shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10268
  format %{ "psrad   $dst,$shift\t! arithmetic right shift packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10269
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10270
    __ psrad($dst$$XMMRegister, (int)$shift$$constant);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10271
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10272
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10273
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10274
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
 10275
instruct vsra4I_reg(vecX dst, vecX src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10276
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10277
  match(Set dst (RShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10278
  format %{ "vpsrad  $dst,$src,$shift\t! arithmetic right shift packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10279
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10280
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10281
    __ vpsrad($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10282
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10283
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10284
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10285
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10286
instruct vsra4I_reg_imm(vecX dst, vecX src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10287
  predicate(UseAVX > 0 && n->as_Vector()->length() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10288
  match(Set dst (RShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10289
  format %{ "vpsrad  $dst,$src,$shift\t! arithmetic right shift packed4I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10290
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10291
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10292
    __ vpsrad($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10293
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10294
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10295
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10296
13930
8df570f94294 7201026: add vector for shift count
kvn
parents: 13886
diff changeset
 10297
instruct vsra8I_reg(vecY dst, vecY src, vecS shift) %{
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10298
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10299
  match(Set dst (RShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10300
  format %{ "vpsrad  $dst,$src,$shift\t! arithmetic right shift packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10301
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10302
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10303
    __ vpsrad($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10304
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10305
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10306
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10307
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10308
instruct vsra8I_reg_imm(vecY dst, vecY src, immI8 shift) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10309
  predicate(UseAVX > 1 && n->as_Vector()->length() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10310
  match(Set dst (RShiftVI src shift));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10311
  format %{ "vpsrad  $dst,$src,$shift\t! arithmetic right shift packed8I" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10312
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10313
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10314
    __ vpsrad($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10315
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10316
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10317
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10318
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10319
instruct vsra16I_reg(vecZ dst, vecZ src, vecS shift) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10320
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10321
  match(Set dst (RShiftVI src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10322
  format %{ "vpsrad  $dst,$src,$shift\t! arithmetic right shift packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10323
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10324
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10325
    __ vpsrad($dst$$XMMRegister, $src$$XMMRegister, $shift$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10326
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10327
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10328
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10329
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10330
instruct vsra16I_reg_imm(vecZ dst, vecZ src, immI8 shift) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10331
  predicate(UseAVX > 2 && n->as_Vector()->length() == 16);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10332
  match(Set dst (RShiftVI src shift));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10333
  format %{ "vpsrad  $dst,$src,$shift\t! arithmetic right shift packed16I" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10334
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10335
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10336
    __ vpsrad($dst$$XMMRegister, $src$$XMMRegister, (int)$shift$$constant, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10337
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10338
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10339
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10340
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10341
// There are no longs vector arithmetic right shift instructions.
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10342
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10343
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10344
// --------------------------------- AND --------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10345
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10346
instruct vand4B(vecS dst, vecS src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10347
  predicate(n->as_Vector()->length_in_bytes() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10348
  match(Set dst (AndV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10349
  format %{ "pand    $dst,$src\t! and vectors (4 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10350
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10351
    __ pand($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10352
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10353
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10354
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10355
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10356
instruct vand4B_reg(vecS dst, vecS src1, vecS src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10357
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10358
  match(Set dst (AndV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10359
  format %{ "vpand   $dst,$src1,$src2\t! and vectors (4 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10360
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10361
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10362
    __ vpand($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10363
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10364
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10365
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10366
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10367
instruct vand4B_mem(vecS dst, vecS src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10368
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10369
  match(Set dst (AndV src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10370
  format %{ "vpand   $dst,$src,$mem\t! and vectors (4 bytes)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10371
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10372
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10373
    __ vpand($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10374
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10375
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10376
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10377
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10378
instruct vand8B(vecD dst, vecD src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10379
  predicate(n->as_Vector()->length_in_bytes() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10380
  match(Set dst (AndV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10381
  format %{ "pand    $dst,$src\t! and vectors (8 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10382
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10383
    __ pand($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10384
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10385
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10386
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10387
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10388
instruct vand8B_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10389
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10390
  match(Set dst (AndV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10391
  format %{ "vpand   $dst,$src1,$src2\t! and vectors (8 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10392
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10393
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10394
    __ vpand($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10395
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10396
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10397
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10398
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10399
instruct vand8B_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10400
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 8);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10401
  match(Set dst (AndV src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10402
  format %{ "vpand   $dst,$src,$mem\t! and vectors (8 bytes)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10403
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10404
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10405
    __ vpand($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10406
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10407
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10408
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10409
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10410
instruct vand16B(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10411
  predicate(n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10412
  match(Set dst (AndV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10413
  format %{ "pand    $dst,$src\t! and vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10414
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10415
    __ pand($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10416
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10417
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10418
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10419
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10420
instruct vand16B_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10421
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10422
  match(Set dst (AndV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10423
  format %{ "vpand   $dst,$src1,$src2\t! and vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10424
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10425
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10426
    __ vpand($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10427
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10428
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10429
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10430
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10431
instruct vand16B_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10432
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10433
  match(Set dst (AndV src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10434
  format %{ "vpand   $dst,$src,$mem\t! and vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10435
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10436
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10437
    __ vpand($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10438
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10439
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10440
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10441
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10442
instruct vand32B_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10443
  predicate(UseAVX > 1 && n->as_Vector()->length_in_bytes() == 32);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10444
  match(Set dst (AndV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10445
  format %{ "vpand   $dst,$src1,$src2\t! and vectors (32 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10446
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10447
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10448
    __ vpand($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10449
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10450
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10451
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10452
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10453
instruct vand32B_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10454
  predicate(UseAVX > 1 && n->as_Vector()->length_in_bytes() == 32);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10455
  match(Set dst (AndV src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10456
  format %{ "vpand   $dst,$src,$mem\t! and vectors (32 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10457
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10458
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10459
    __ vpand($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10460
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10461
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10462
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10463
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10464
instruct vand64B_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10465
  predicate(UseAVX > 2 && n->as_Vector()->length_in_bytes() == 64);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10466
  match(Set dst (AndV src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10467
  format %{ "vpand   $dst,$src1,$src2\t! and vectors (64 bytes)" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10468
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10469
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10470
    __ vpand($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10471
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10472
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10473
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10474
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10475
instruct vand64B_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10476
  predicate(UseAVX > 2 && n->as_Vector()->length_in_bytes() == 64);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10477
  match(Set dst (AndV src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10478
  format %{ "vpand   $dst,$src,$mem\t! and vectors (64 bytes)" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10479
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10480
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10481
    __ vpand($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10482
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10483
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10484
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10486
// --------------------------------- OR ---------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10487
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10488
instruct vor4B(vecS dst, vecS src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10489
  predicate(n->as_Vector()->length_in_bytes() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10490
  match(Set dst (OrV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10491
  format %{ "por     $dst,$src\t! or vectors (4 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10492
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10493
    __ por($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10494
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10495
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10496
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10497
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10498
instruct vor4B_reg(vecS dst, vecS src1, vecS src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10499
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10500
  match(Set dst (OrV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10501
  format %{ "vpor    $dst,$src1,$src2\t! or vectors (4 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10502
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10503
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10504
    __ vpor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10505
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10506
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10507
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10508
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10509
instruct vor4B_mem(vecS dst, vecS src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10510
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10511
  match(Set dst (OrV src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10512
  format %{ "vpor    $dst,$src,$mem\t! or vectors (4 bytes)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10513
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10514
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10515
    __ vpor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10516
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10517
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10518
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10519
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10520
instruct vor8B(vecD dst, vecD src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10521
  predicate(n->as_Vector()->length_in_bytes() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10522
  match(Set dst (OrV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10523
  format %{ "por     $dst,$src\t! or vectors (8 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10524
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10525
    __ por($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10526
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10527
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10528
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10529
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10530
instruct vor8B_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10531
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10532
  match(Set dst (OrV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10533
  format %{ "vpor    $dst,$src1,$src2\t! or vectors (8 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10534
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10535
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10536
    __ vpor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10537
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10538
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10539
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10540
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10541
instruct vor8B_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10542
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10543
  match(Set dst (OrV src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10544
  format %{ "vpor    $dst,$src,$mem\t! or vectors (8 bytes)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10545
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10546
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10547
    __ vpor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10548
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10549
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10550
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10551
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10552
instruct vor16B(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10553
  predicate(n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10554
  match(Set dst (OrV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10555
  format %{ "por     $dst,$src\t! or vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10556
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10557
    __ por($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10558
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10559
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10560
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10561
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10562
instruct vor16B_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10563
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10564
  match(Set dst (OrV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10565
  format %{ "vpor    $dst,$src1,$src2\t! or vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10566
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10567
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10568
    __ vpor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10569
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10570
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10571
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10572
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10573
instruct vor16B_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10574
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10575
  match(Set dst (OrV src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10576
  format %{ "vpor    $dst,$src,$mem\t! or vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10577
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10578
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10579
    __ vpor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10580
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10581
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10582
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10583
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10584
instruct vor32B_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10585
  predicate(UseAVX > 1 && n->as_Vector()->length_in_bytes() == 32);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10586
  match(Set dst (OrV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10587
  format %{ "vpor    $dst,$src1,$src2\t! or vectors (32 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10588
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10589
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10590
    __ vpor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10591
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10592
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10593
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10594
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10595
instruct vor32B_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10596
  predicate(UseAVX > 1 && n->as_Vector()->length_in_bytes() == 32);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10597
  match(Set dst (OrV src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10598
  format %{ "vpor    $dst,$src,$mem\t! or vectors (32 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10599
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10600
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10601
    __ vpor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10602
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10603
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10604
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10605
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10606
instruct vor64B_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10607
  predicate(UseAVX > 2 && n->as_Vector()->length_in_bytes() == 64);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10608
  match(Set dst (OrV src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10609
  format %{ "vpor    $dst,$src1,$src2\t! or vectors (64 bytes)" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10610
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10611
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10612
    __ vpor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10613
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10614
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10615
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10616
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10617
instruct vor64B_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10618
  predicate(UseAVX > 2 && n->as_Vector()->length_in_bytes() == 64);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10619
  match(Set dst (OrV src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10620
  format %{ "vpor    $dst,$src,$mem\t! or vectors (64 bytes)" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10621
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10622
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10623
    __ vpor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10624
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10625
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10626
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10627
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10628
// --------------------------------- XOR --------------------------------------
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10629
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10630
instruct vxor4B(vecS dst, vecS src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10631
  predicate(n->as_Vector()->length_in_bytes() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10632
  match(Set dst (XorV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10633
  format %{ "pxor    $dst,$src\t! xor vectors (4 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10634
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10635
    __ pxor($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10636
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10637
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10638
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10639
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10640
instruct vxor4B_reg(vecS dst, vecS src1, vecS src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10641
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10642
  match(Set dst (XorV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10643
  format %{ "vpxor   $dst,$src1,$src2\t! xor vectors (4 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10644
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10645
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10646
    __ vpxor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10647
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10648
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10649
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10650
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10651
instruct vxor4B_mem(vecS dst, vecS src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10652
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 4);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10653
  match(Set dst (XorV src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10654
  format %{ "vpxor   $dst,$src,$mem\t! xor vectors (4 bytes)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10655
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10656
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10657
    __ vpxor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10658
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10659
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10660
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10661
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10662
instruct vxor8B(vecD dst, vecD src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10663
  predicate(n->as_Vector()->length_in_bytes() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10664
  match(Set dst (XorV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10665
  format %{ "pxor    $dst,$src\t! xor vectors (8 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10666
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10667
    __ pxor($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10668
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10669
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10670
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10671
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10672
instruct vxor8B_reg(vecD dst, vecD src1, vecD src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10673
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 8);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10674
  match(Set dst (XorV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10675
  format %{ "vpxor   $dst,$src1,$src2\t! xor vectors (8 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10676
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10677
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10678
    __ vpxor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10679
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10680
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10681
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10682
31410
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10683
instruct vxor8B_mem(vecD dst, vecD src, memory mem) %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10684
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 8);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10685
  match(Set dst (XorV src (LoadVector mem)));
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10686
  format %{ "vpxor   $dst,$src,$mem\t! xor vectors (8 bytes)" %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10687
  ins_encode %{
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10688
    int vector_len = 0;
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10689
    __ vpxor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10690
  %}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10691
  ins_pipe( pipe_slow );
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10692
%}
2a222ae1205f 8081247: AVX 512 extended support
mcberg
parents: 30624
diff changeset
 10693
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10694
instruct vxor16B(vecX dst, vecX src) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10695
  predicate(n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10696
  match(Set dst (XorV dst src));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10697
  format %{ "pxor    $dst,$src\t! xor vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10698
  ins_encode %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10699
    __ pxor($dst$$XMMRegister, $src$$XMMRegister);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10700
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10701
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10702
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10703
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10704
instruct vxor16B_reg(vecX dst, vecX src1, vecX src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10705
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10706
  match(Set dst (XorV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10707
  format %{ "vpxor   $dst,$src1,$src2\t! xor vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10708
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10709
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10710
    __ vpxor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10711
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10712
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10713
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10714
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10715
instruct vxor16B_mem(vecX dst, vecX src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10716
  predicate(UseAVX > 0 && n->as_Vector()->length_in_bytes() == 16);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10717
  match(Set dst (XorV src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10718
  format %{ "vpxor   $dst,$src,$mem\t! xor vectors (16 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10719
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10720
    int vector_len = 0;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10721
    __ vpxor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10722
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10723
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10724
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10725
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10726
instruct vxor32B_reg(vecY dst, vecY src1, vecY src2) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10727
  predicate(UseAVX > 1 && n->as_Vector()->length_in_bytes() == 32);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10728
  match(Set dst (XorV src1 src2));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10729
  format %{ "vpxor   $dst,$src1,$src2\t! xor vectors (32 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10730
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10731
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10732
    __ vpxor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
13485
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10733
  %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10734
  ins_pipe( pipe_slow );
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10735
%}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10736
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10737
instruct vxor32B_mem(vecY dst, vecY src, memory mem) %{
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10738
  predicate(UseAVX > 1 && n->as_Vector()->length_in_bytes() == 32);
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10739
  match(Set dst (XorV src (LoadVector mem)));
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10740
  format %{ "vpxor   $dst,$src,$mem\t! xor vectors (32 bytes)" %}
6c7faa516fc6 6340864: Implement vectorization optimizations in hotspot-server
kvn
parents: 13294
diff changeset
 10741
  ins_encode %{
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10742
    int vector_len = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10743
    __ vpxor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10744
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10745
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10746
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10747
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10748
instruct vxor64B_reg(vecZ dst, vecZ src1, vecZ src2) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10749
  predicate(UseAVX > 2 && n->as_Vector()->length_in_bytes() == 64);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10750
  match(Set dst (XorV src1 src2));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10751
  format %{ "vpxor   $dst,$src1,$src2\t! xor vectors (64 bytes)" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10752
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10753
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10754
    __ vpxor($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10755
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10756
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10757
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10758
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10759
instruct vxor64B_mem(vecZ dst, vecZ src, memory mem) %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10760
  predicate(UseAVX > 2 && n->as_Vector()->length_in_bytes() == 64);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10761
  match(Set dst (XorV src (LoadVector mem)));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10762
  format %{ "vpxor   $dst,$src,$mem\t! xor vectors (64 bytes)" %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10763
  ins_encode %{
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10764
    int vector_len = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10765
    __ vpxor($dst$$XMMRegister, $src$$XMMRegister, $mem$$Address, vector_len);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10766
  %}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10767
  ins_pipe( pipe_slow );
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10768
%}
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30305
diff changeset
 10769
46528
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10770
// --------------------------------- FMA --------------------------------------
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10771
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10772
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10773
instruct vfma2D_reg(vecX a, vecX b, vecX c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10774
  predicate(UseFMA && n->as_Vector()->length() == 2);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10775
  match(Set c (FmaVD  c (Binary a b)));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10776
  format %{ "fmapd $a,$b,$c\t# $c = $a * $b + $c fma packed2D" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10777
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10778
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10779
    int vector_len = 0;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10780
    __ vfmad($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10781
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10782
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10783
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10784
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10785
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10786
instruct vfma2D_mem(vecX a, memory b, vecX c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10787
  predicate(UseFMA && n->as_Vector()->length() == 2);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10788
  match(Set c (FmaVD  c (Binary a (LoadVector b))));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10789
  format %{ "fmapd $a,$b,$c\t# $c = $a * $b + $c fma packed2D" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10790
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10791
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10792
    int vector_len = 0;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10793
    __ vfmad($c$$XMMRegister, $a$$XMMRegister, $b$$Address, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10794
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10795
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10796
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10797
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10798
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10799
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10800
instruct vfma4D_reg(vecY a, vecY b, vecY c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10801
  predicate(UseFMA && n->as_Vector()->length() == 4);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10802
  match(Set c (FmaVD  c (Binary a b)));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10803
  format %{ "fmapd $a,$b,$c\t# $c = $a * $b + $c fma packed4D" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10804
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10805
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10806
    int vector_len = 1;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10807
    __ vfmad($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10808
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10809
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10810
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10811
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10812
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10813
instruct vfma4D_mem(vecY a, memory b, vecY c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10814
  predicate(UseFMA && n->as_Vector()->length() == 4);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10815
  match(Set c (FmaVD  c (Binary a (LoadVector b))));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10816
  format %{ "fmapd $a,$b,$c\t# $c = $a * $b + $c fma packed4D" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10817
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10818
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10819
    int vector_len = 1;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10820
    __ vfmad($c$$XMMRegister, $a$$XMMRegister, $b$$Address, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10821
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10822
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10823
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10824
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10825
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10826
instruct vfma8D_reg(vecZ a, vecZ b, vecZ c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10827
  predicate(UseFMA && n->as_Vector()->length() == 8);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10828
  match(Set c (FmaVD  c (Binary a b)));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10829
  format %{ "fmapd $a,$b,$c\t# $c = $a * $b + $c fma packed8D" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10830
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10831
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10832
    int vector_len = 2;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10833
    __ vfmad($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10834
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10835
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10836
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10837
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10838
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10839
instruct vfma8D_mem(vecZ a, memory b, vecZ c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10840
  predicate(UseFMA && n->as_Vector()->length() == 8);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10841
  match(Set c (FmaVD  c (Binary a (LoadVector b))));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10842
  format %{ "fmapd $a,$b,$c\t# $c = $a * $b + $c fma packed8D" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10843
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10844
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10845
    int vector_len = 2;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10846
    __ vfmad($c$$XMMRegister, $a$$XMMRegister, $b$$Address, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10847
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10848
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10849
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10850
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10851
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10852
instruct vfma4F_reg(vecX a, vecX b, vecX c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10853
  predicate(UseFMA && n->as_Vector()->length() == 4);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10854
  match(Set c (FmaVF  c (Binary a b)));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10855
  format %{ "fmaps $a,$b,$c\t# $c = $a * $b + $c fma packed4F" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10856
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10857
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10858
    int vector_len = 0;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10859
    __ vfmaf($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10860
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10861
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10862
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10863
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10864
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10865
instruct vfma4F_mem(vecX a, memory b, vecX c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10866
  predicate(UseFMA && n->as_Vector()->length() == 4);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10867
  match(Set c (FmaVF  c (Binary a (LoadVector b))));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10868
  format %{ "fmaps $a,$b,$c\t# $c = $a * $b + $c fma packed4F" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10869
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10870
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10871
    int vector_len = 0;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10872
    __ vfmaf($c$$XMMRegister, $a$$XMMRegister, $b$$Address, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10873
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10874
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10875
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10876
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10877
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10878
instruct vfma8F_reg(vecY a, vecY b, vecY c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10879
  predicate(UseFMA && n->as_Vector()->length() == 8);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10880
  match(Set c (FmaVF  c (Binary a b)));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10881
  format %{ "fmaps $a,$b,$c\t# $c = $a * $b + $c fma packed8F" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10882
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10883
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10884
    int vector_len = 1;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10885
    __ vfmaf($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10886
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10887
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10888
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10889
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10890
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10891
instruct vfma8F_mem(vecY a, memory b, vecY c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10892
  predicate(UseFMA && n->as_Vector()->length() == 8);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10893
  match(Set c (FmaVF  c (Binary a (LoadVector b))));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10894
  format %{ "fmaps $a,$b,$c\t# $c = $a * $b + $c fma packed8F" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10895
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10896
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10897
    int vector_len = 1;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10898
    __ vfmaf($c$$XMMRegister, $a$$XMMRegister, $b$$Address, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10899
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10900
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10901
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10902
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10903
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10904
instruct vfma16F_reg(vecZ a, vecZ b, vecZ c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10905
  predicate(UseFMA && n->as_Vector()->length() == 16);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10906
  match(Set c (FmaVF  c (Binary a b)));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10907
  format %{ "fmaps $a,$b,$c\t# $c = $a * $b + $c fma packed16F" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10908
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10909
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10910
    int vector_len = 2;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10911
    __ vfmaf($c$$XMMRegister, $a$$XMMRegister, $b$$XMMRegister, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10912
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10913
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10914
%}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10915
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10916
// a * b + c
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10917
instruct vfma16F_mem(vecZ a, memory b, vecZ c) %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10918
  predicate(UseFMA && n->as_Vector()->length() == 16);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10919
  match(Set c (FmaVF  c (Binary a (LoadVector b))));
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10920
  format %{ "fmaps $a,$b,$c\t# $c = $a * $b + $c fma packed16F" %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10921
  ins_cost(150);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10922
  ins_encode %{
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10923
    int vector_len = 2;
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10924
    __ vfmaf($c$$XMMRegister, $a$$XMMRegister, $b$$Address, $c$$XMMRegister, vector_len);
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10925
  %}
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10926
  ins_pipe( pipe_slow );
cf0da758e7b5 8181616: FMA Vectorization on x86
vdeshpande
parents: 46525
diff changeset
 10927
%}
49384
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10928
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10929
// --------------------------------- PopCount --------------------------------------
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10930
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10931
instruct vpopcount2I(vecD dst, vecD src) %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10932
  predicate(VM_Version::supports_vpopcntdq() && UsePopCountInstruction && n->as_Vector()->length() == 2);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10933
  match(Set dst (PopCountVI src));
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10934
  format %{ "vpopcntd  $dst,$src\t! vector popcount packed2I" %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10935
  ins_encode %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10936
    int vector_len = 0;
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10937
    __ vpopcntd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10938
  %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10939
  ins_pipe( pipe_slow );
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10940
%}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10941
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10942
instruct vpopcount4I(vecX dst, vecX src) %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10943
  predicate(VM_Version::supports_vpopcntdq() && UsePopCountInstruction && n->as_Vector()->length() == 4);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10944
  match(Set dst (PopCountVI src));
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10945
  format %{ "vpopcntd  $dst,$src\t! vector popcount packed4I" %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10946
  ins_encode %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10947
    int vector_len = 0;
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10948
    __ vpopcntd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10949
  %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10950
  ins_pipe( pipe_slow );
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10951
%}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10952
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10953
instruct vpopcount8I(vecY dst, vecY src) %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10954
  predicate(VM_Version::supports_vpopcntdq() && UsePopCountInstruction && n->as_Vector()->length() == 8);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10955
  match(Set dst (PopCountVI src));
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10956
  format %{ "vpopcntd  $dst,$src\t! vector popcount packed8I" %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10957
  ins_encode %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10958
    int vector_len = 1;
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10959
    __ vpopcntd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10960
  %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10961
  ins_pipe( pipe_slow );
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10962
%}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10963
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10964
instruct vpopcount16I(vecZ dst, vecZ src) %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10965
  predicate(VM_Version::supports_vpopcntdq() && UsePopCountInstruction && n->as_Vector()->length() == 16);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10966
  match(Set dst (PopCountVI src));
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10967
  format %{ "vpopcntd  $dst,$src\t! vector popcount packed16I" %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10968
  ins_encode %{
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10969
    int vector_len = 2;
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10970
    __ vpopcntd($dst$$XMMRegister, $src$$XMMRegister, vector_len);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10971
  %}
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10972
  ins_pipe( pipe_slow );
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48309
diff changeset
 10973
%}