src/hotspot/share/opto/regmask.cpp
author vdeshpande
Mon, 09 Jul 2018 13:25:08 -0700
changeset 51017 dd7ce84016a5
parent 47216 71c04702a3d5
child 53443 675d857f5ee3
permissions -rw-r--r--
8194740: UseSubwordForMaxVector causes performance regression Reviewed-by: kvn, thartmann
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
     1
/*
24424
2658d7834c6e 8037816: Fix for 8036122 breaks build with Xcode5/clang
drchase
parents: 22807
diff changeset
     2
 * Copyright (c) 1997, 2014, Oracle and/or its affiliates. All rights reserved.
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
489c9b5090e2 Initial load
duke
parents:
diff changeset
     4
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
489c9b5090e2 Initial load
duke
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
489c9b5090e2 Initial load
duke
parents:
diff changeset
     7
 * published by the Free Software Foundation.
489c9b5090e2 Initial load
duke
parents:
diff changeset
     8
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
     9
 * This code is distributed in the hope that it will be useful, but WITHOUT
489c9b5090e2 Initial load
duke
parents:
diff changeset
    10
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
489c9b5090e2 Initial load
duke
parents:
diff changeset
    11
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
489c9b5090e2 Initial load
duke
parents:
diff changeset
    12
 * version 2 for more details (a copy is included in the LICENSE file that
489c9b5090e2 Initial load
duke
parents:
diff changeset
    13
 * accompanied this code).
489c9b5090e2 Initial load
duke
parents:
diff changeset
    14
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
    15
 * You should have received a copy of the GNU General Public License version
489c9b5090e2 Initial load
duke
parents:
diff changeset
    16
 * 2 along with this work; if not, write to the Free Software Foundation,
489c9b5090e2 Initial load
duke
parents:
diff changeset
    17
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
489c9b5090e2 Initial load
duke
parents:
diff changeset
    18
 *
5547
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1
diff changeset
    19
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1
diff changeset
    20
 * or visit www.oracle.com if you need additional information or have any
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1
diff changeset
    21
 * questions.
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    22
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
    23
 */
489c9b5090e2 Initial load
duke
parents:
diff changeset
    24
7397
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 5547
diff changeset
    25
#include "precompiled.hpp"
25715
d5a8dbdc5150 8049325: Introduce and clean up umbrella headers for the files in the cpu subdirectories.
goetz
parents: 24429
diff changeset
    26
#include "opto/ad.hpp"
7397
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 5547
diff changeset
    27
#include "opto/compile.hpp"
31620
53be635ad49c 8087333: Optionally Pre-Generate the HotSpot Template Interpreter
bdelsart
parents: 30624
diff changeset
    28
#include "opto/matcher.hpp"
53be635ad49c 8087333: Optionally Pre-Generate the HotSpot Template Interpreter
bdelsart
parents: 30624
diff changeset
    29
#include "opto/node.hpp"
7397
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 5547
diff changeset
    30
#include "opto/regmask.hpp"
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    31
489c9b5090e2 Initial load
duke
parents:
diff changeset
    32
// Local shorthand: the loops in this file iterate over the mask words with
// "i < RM_SIZE" rather than spelling out _RM_SIZE each time.
#define RM_SIZE _RM_SIZE /* a constant private to the class RegMask */
489c9b5090e2 Initial load
duke
parents:
diff changeset
    33
489c9b5090e2 Initial load
duke
parents:
diff changeset
    34
//-------------Non-zero bit search methods used by RegMask---------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
    35
// Find the bit index (0..31) of the lowest 1 in 'mask', or return 32 if
// 'mask' is empty.
int find_lowest_bit( uint32_t mask ) {
  if( mask == 0 ) {             // No bits at all
    return 32;
  }
  // Binary search: whenever the low half of the remaining window is empty,
  // discard it and account for its width in 'n'.
  int n = 0;
  if( (mask & 0xffff) == 0 ) {
    mask >>= 16;
    n += 16;
  }
  if( (mask & 0xff) == 0 ) {
    mask >>= 8;
    n += 8;
  }
  if( (mask & 0xf) == 0 ) {
    mask >>= 4;
    n += 4;
  }
  if( (mask & 0x3) == 0 ) {
    mask >>= 2;
    n += 2;
  }
  if( (mask & 0x1) == 0 ) {
    n += 1;
  }
  return n;
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
    63
489c9b5090e2 Initial load
duke
parents:
diff changeset
    64
// Find the bit index (0..31) of the highest 1 in 'mask', or return 32 if
// 'mask' is empty.
// NOTE: the spelling of the function name is part of its interface and is
// deliberately left unchanged here.
int find_hihghest_bit( uint32_t mask ) {
  if( mask == 0 ) {             // No bits at all
    return 32;
  }
  // Binary search: whenever something is set above the low half of the
  // remaining window, move to the high half and account for it in 'n'.
  int n = 0;
  if( mask > 0xffff ) {
    mask >>= 16;
    n += 16;
  }
  if( mask > 0xff ) {
    mask >>= 8;
    n += 8;
  }
  if( mask > 0xf ) {
    mask >>= 4;
    n += 4;
  }
  if( mask > 0x3 ) {
    mask >>= 2;
    n += 2;
  }
  if( mask > 0x1 ) {
    n += 1;
  }
  return n;
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
    92
489c9b5090e2 Initial load
duke
parents:
diff changeset
    93
//------------------------------dump-------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
    94
489c9b5090e2 Initial load
duke
parents:
diff changeset
    95
#ifndef PRODUCT
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
    96
void OptoReg::dump(int r, outputStream *st) {
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
    97
  switch (r) {
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
    98
  case Special: st->print("r---"); break;
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
    99
  case Bad:     st->print("rBAD"); break;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   100
  default:
24424
2658d7834c6e 8037816: Fix for 8036122 breaks build with Xcode5/clang
drchase
parents: 22807
diff changeset
   101
    if (r < _last_Mach_Reg) st->print("%s", Matcher::regName[r]);
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   102
    else st->print("rS%d",r);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   103
    break;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   104
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   105
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   106
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
   107
489c9b5090e2 Initial load
duke
parents:
diff changeset
   108
489c9b5090e2 Initial load
duke
parents:
diff changeset
   109
//=============================================================================
489c9b5090e2 Initial load
duke
parents:
diff changeset
   110
// The constant mask whose constructor arguments are all zero.  BODY(I) is
// temporarily defined as "0," so that expanding FORALL_BODY (defined
// elsewhere; presumably it invokes BODY once per mask word - confirm against
// the RegMask declaration) yields a run of zero arguments, followed by one
// final literal 0.
const RegMask RegMask::Empty(
# define BODY(I) 0,
  FORALL_BODY
# undef BODY
  0
);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   116
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   117
//=============================================================================
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   118
// Return true if 'ireg' is one of the vector ideal register kinds
// (Op_VecS, Op_VecD, Op_VecX, Op_VecY or Op_VecZ), false otherwise.
bool RegMask::is_vector(uint ireg) {
  switch (ireg) {
    case Op_VecS:
    case Op_VecD:
    case Op_VecX:
    case Op_VecY:
    case Op_VecZ:
      return true;
    default:
      return false;
  }
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   122
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   123
// Return the register count associated with ideal register kind 'ireg':
// 16 for Op_VecZ, 8 for Op_VecY, 4 for Op_VecX, 2 for Op_VecD, Op_RegD,
// Op_RegL (and Op_RegP when _LP64 is defined), and 1 for everything else.
int RegMask::num_registers(uint ireg) {
  switch (ireg) {
    case Op_VecZ:
      return 16;
    case Op_VecY:
      return 8;
    case Op_VecX:
      return 4;
    case Op_VecD:
    case Op_RegD:
    case Op_RegL:
#ifdef _LP64
    case Op_RegP:
#endif
      return 2;
    default:
      // Op_VecS and the rest of the ideal registers.
      return 1;
  }
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   142
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   143
//------------------------------find_first_pair--------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   144
// Find the lowest-numbered register pair in the mask.  Return the
489c9b5090e2 Initial load
duke
parents:
diff changeset
   145
// HIGHEST register number in the pair, or BAD if no pairs.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   146
OptoReg::Name RegMask::find_first_pair() const {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   147
  verify_pairs();
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   148
  for( int i = 0; i < RM_SIZE; i++ ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   149
    if( _A[i] ) {               // Found some bits
489c9b5090e2 Initial load
duke
parents:
diff changeset
   150
      int bit = _A[i] & -_A[i]; // Extract low bit
489c9b5090e2 Initial load
duke
parents:
diff changeset
   151
      // Convert to bit number, return hi bit in pair
489c9b5090e2 Initial load
duke
parents:
diff changeset
   152
      return OptoReg::Name((i<<_LogWordBits)+find_lowest_bit(bit)+1);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   153
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   154
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   155
  return OptoReg::Bad;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   156
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   157
489c9b5090e2 Initial load
duke
parents:
diff changeset
   158
//------------------------------ClearToPairs-----------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   159
// Clear out partial bits; leave only bit pairs
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   160
void RegMask::clear_to_pairs() {
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   161
  for( int i = 0; i < RM_SIZE; i++ ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   162
    int bits = _A[i];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   163
    bits &= ((bits & 0x55555555)<<1); // 1 hi-bit set for each pair
489c9b5090e2 Initial load
duke
parents:
diff changeset
   164
    bits |= (bits>>1);          // Smear 1 hi-bit into a pair
489c9b5090e2 Initial load
duke
parents:
diff changeset
   165
    _A[i] = bits;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   166
  }
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   167
  verify_pairs();
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   168
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   169
489c9b5090e2 Initial load
duke
parents:
diff changeset
   170
//------------------------------SmearToPairs-----------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   171
// Smear out partial bits; leave only bit pairs
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   172
void RegMask::smear_to_pairs() {
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   173
  for( int i = 0; i < RM_SIZE; i++ ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   174
    int bits = _A[i];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   175
    bits |= ((bits & 0x55555555)<<1); // Smear lo bit hi per pair
489c9b5090e2 Initial load
duke
parents:
diff changeset
   176
    bits |= ((bits & 0xAAAAAAAA)>>1); // Smear hi bit lo per pair
489c9b5090e2 Initial load
duke
parents:
diff changeset
   177
    _A[i] = bits;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   178
  }
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   179
  verify_pairs();
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   180
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   181
489c9b5090e2 Initial load
duke
parents:
diff changeset
   182
//------------------------------is_aligned_pairs-------------------------------
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   183
bool RegMask::is_aligned_pairs() const {
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   184
  // Assert that the register mask contains only bit pairs.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   185
  for( int i = 0; i < RM_SIZE; i++ ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   186
    int bits = _A[i];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   187
    while( bits ) {             // Check bits for pairing
489c9b5090e2 Initial load
duke
parents:
diff changeset
   188
      int bit = bits & -bits;   // Extract low bit
489c9b5090e2 Initial load
duke
parents:
diff changeset
   189
      // Low bit is not odd means its mis-aligned.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   190
      if( (bit & 0x55555555) == 0 ) return false;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   191
      bits -= bit;              // Remove bit from mask
489c9b5090e2 Initial load
duke
parents:
diff changeset
   192
      // Check for aligned adjacent bit
489c9b5090e2 Initial load
duke
parents:
diff changeset
   193
      if( (bits & (bit<<1)) == 0 ) return false;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   194
      bits -= (bit<<1);         // Remove other halve of pair
489c9b5090e2 Initial load
duke
parents:
diff changeset
   195
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   196
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   197
  return true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   198
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   199
489c9b5090e2 Initial load
duke
parents:
diff changeset
   200
//------------------------------is_bound1--------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   201
// Return TRUE if the mask contains a single bit
489c9b5090e2 Initial load
duke
parents:
diff changeset
   202
int RegMask::is_bound1() const {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   203
  if( is_AllStack() ) return false;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   204
  int bit = -1;                 // Set to hold the one bit allowed
489c9b5090e2 Initial load
duke
parents:
diff changeset
   205
  for( int i = 0; i < RM_SIZE; i++ ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   206
    if( _A[i] ) {               // Found some bits
489c9b5090e2 Initial load
duke
parents:
diff changeset
   207
      if( bit != -1 ) return false; // Already had bits, so fail
489c9b5090e2 Initial load
duke
parents:
diff changeset
   208
      bit = _A[i] & -_A[i];     // Extract 1 bit from mask
489c9b5090e2 Initial load
duke
parents:
diff changeset
   209
      if( bit != _A[i] ) return false; // Found many bits, so fail
489c9b5090e2 Initial load
duke
parents:
diff changeset
   210
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   211
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   212
  // True for both the empty mask and for a single bit
489c9b5090e2 Initial load
duke
parents:
diff changeset
   213
  return true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   214
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   215
489c9b5090e2 Initial load
duke
parents:
diff changeset
   216
//------------------------------is_bound2--------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   217
// Return TRUE if the mask contains an adjacent pair of bits and no other bits.
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   218
int RegMask::is_bound_pair() const {
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   219
  if( is_AllStack() ) return false;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   220
489c9b5090e2 Initial load
duke
parents:
diff changeset
   221
  int bit = -1;                 // Set to hold the one bit allowed
489c9b5090e2 Initial load
duke
parents:
diff changeset
   222
  for( int i = 0; i < RM_SIZE; i++ ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   223
    if( _A[i] ) {               // Found some bits
489c9b5090e2 Initial load
duke
parents:
diff changeset
   224
      if( bit != -1 ) return false; // Already had bits, so fail
489c9b5090e2 Initial load
duke
parents:
diff changeset
   225
      bit = _A[i] & -(_A[i]);   // Extract 1 bit from mask
489c9b5090e2 Initial load
duke
parents:
diff changeset
   226
      if( (bit << 1) != 0 ) {   // Bit pair stays in same word?
489c9b5090e2 Initial load
duke
parents:
diff changeset
   227
        if( (bit | (bit<<1)) != _A[i] )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   228
          return false;         // Require adjacent bit pair and no more bits
489c9b5090e2 Initial load
duke
parents:
diff changeset
   229
      } else {                  // Else its a split-pair case
489c9b5090e2 Initial load
duke
parents:
diff changeset
   230
        if( bit != _A[i] ) return false; // Found many bits, so fail
489c9b5090e2 Initial load
duke
parents:
diff changeset
   231
        i++;                    // Skip iteration forward
15614
3d9afca22dc7 8007402: Code cleanup to remove Parfait false positive
drchase
parents: 15241
diff changeset
   232
        if( i >= RM_SIZE || _A[i] != 1 )
3d9afca22dc7 8007402: Code cleanup to remove Parfait false positive
drchase
parents: 15241
diff changeset
   233
          return false; // Require 1 lo bit in next word
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   234
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   235
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   236
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   237
  // True for both the empty mask and for a bit pair
489c9b5090e2 Initial load
duke
parents:
diff changeset
   238
  return true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   239
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   240
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   241
// Per-set-size masks with the lowest bit of every aligned group set:
// groups of 2, 4, 8 and 16 bits respectively.  The table is indexed with
// (size >> 2), so only indices 0, 1, 2 and 4 are accessed; index 3 is only
// filled in for storage.
static int low_bits[5] = { 0x55555555, 0x11111111, 0x01010101, 0x00000000, 0x00010001 };
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   243
//------------------------------find_first_set---------------------------------
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   244
// Find the lowest-numbered register set in the mask.  Return the
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   245
// HIGHEST register number in the set, or BAD if no sets.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   246
// Works also for size 1.
15614
3d9afca22dc7 8007402: Code cleanup to remove Parfait false positive
drchase
parents: 15241
diff changeset
   247
OptoReg::Name RegMask::find_first_set(const int size) const {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   248
  verify_sets(size);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   249
  for (int i = 0; i < RM_SIZE; i++) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   250
    if (_A[i]) {                // Found some bits
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   251
      int bit = _A[i] & -_A[i]; // Extract low bit
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   252
      // Convert to bit number, return hi bit in pair
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   253
      return OptoReg::Name((i<<_LogWordBits)+find_lowest_bit(bit)+(size-1));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   254
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   255
  }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   256
  return OptoReg::Bad;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   257
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   258
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   259
//------------------------------clear_to_sets----------------------------------
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   260
// Clear out partial bits; leave only aligned adjacent bit pairs
15614
3d9afca22dc7 8007402: Code cleanup to remove Parfait false positive
drchase
parents: 15241
diff changeset
   261
void RegMask::clear_to_sets(const int size) {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   262
  if (size == 1) return;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   263
  assert(2 <= size && size <= 16, "update low bits table");
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   264
  assert(is_power_of_2(size), "sanity");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   265
  int low_bits_mask = low_bits[size>>2];
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   266
  for (int i = 0; i < RM_SIZE; i++) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   267
    int bits = _A[i];
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   268
    int sets = (bits & low_bits_mask);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   269
    for (int j = 1; j < size; j++) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   270
      sets = (bits & (sets<<1)); // filter bits which produce whole sets
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   271
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   272
    sets |= (sets>>1);           // Smear 1 hi-bit into a set
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   273
    if (size > 2) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   274
      sets |= (sets>>2);         // Smear 2 hi-bits into a set
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   275
      if (size > 4) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   276
        sets |= (sets>>4);       // Smear 4 hi-bits into a set
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   277
        if (size > 8) {
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   278
          sets |= (sets>>8);     // Smear 8 hi-bits into a set
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   279
        }
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   280
      }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   281
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   282
    _A[i] = sets;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   283
  }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   284
  verify_sets(size);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   285
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   286
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   287
//------------------------------smear_to_sets----------------------------------
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   288
// Smear out partial bits to aligned adjacent bit sets
15614
3d9afca22dc7 8007402: Code cleanup to remove Parfait false positive
drchase
parents: 15241
diff changeset
   289
void RegMask::smear_to_sets(const int size) {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   290
  if (size == 1) return;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   291
  assert(2 <= size && size <= 16, "update low bits table");
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   292
  assert(is_power_of_2(size), "sanity");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   293
  int low_bits_mask = low_bits[size>>2];
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   294
  for (int i = 0; i < RM_SIZE; i++) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   295
    int bits = _A[i];
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   296
    int sets = 0;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   297
    for (int j = 0; j < size; j++) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   298
      sets |= (bits & low_bits_mask);  // collect partial bits
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   299
      bits  = bits>>1;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   300
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   301
    sets |= (sets<<1);           // Smear 1 lo-bit  into a set
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   302
    if (size > 2) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   303
      sets |= (sets<<2);         // Smear 2 lo-bits into a set
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   304
      if (size > 4) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   305
        sets |= (sets<<4);       // Smear 4 lo-bits into a set
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   306
        if (size > 8) {
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   307
          sets |= (sets<<8);     // Smear 8 lo-bits into a set
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   308
        }
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   309
      }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   310
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   311
    _A[i] = sets;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   312
  }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   313
  verify_sets(size);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   314
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   315
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   316
//------------------------------is_aligned_set--------------------------------
15614
3d9afca22dc7 8007402: Code cleanup to remove Parfait false positive
drchase
parents: 15241
diff changeset
   317
bool RegMask::is_aligned_sets(const int size) const {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   318
  if (size == 1) return true;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   319
  assert(2 <= size && size <= 16, "update low bits table");
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   320
  assert(is_power_of_2(size), "sanity");
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   321
  int low_bits_mask = low_bits[size>>2];
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   322
  // Assert that the register mask contains only bit sets.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   323
  for (int i = 0; i < RM_SIZE; i++) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   324
    int bits = _A[i];
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   325
    while (bits) {              // Check bits for pairing
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   326
      int bit = bits & -bits;   // Extract low bit
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   327
      // Low bit is not odd means its mis-aligned.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   328
      if ((bit & low_bits_mask) == 0) return false;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   329
      // Do extra work since (bit << size) may overflow.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   330
      int hi_bit = bit << (size-1); // high bit
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   331
      int set = hi_bit + ((hi_bit-1) & ~(bit-1));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   332
      // Check for aligned adjacent bits in this set
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   333
      if ((bits & set) != set) return false;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   334
      bits -= set;  // Remove this set
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   335
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   336
  }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   337
  return true;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   338
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   339
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   340
//------------------------------is_bound_set-----------------------------------
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   341
// Return TRUE if the mask contains one adjacent set of bits and no other bits.
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   342
// Works also for size 1.
15614
3d9afca22dc7 8007402: Code cleanup to remove Parfait false positive
drchase
parents: 15241
diff changeset
   343
int RegMask::is_bound_set(const int size) const {
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   344
  if( is_AllStack() ) return false;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   345
  assert(1 <= size && size <= 16, "update low bits table");
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   346
  int bit = -1;                 // Set to hold the one bit allowed
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   347
  for (int i = 0; i < RM_SIZE; i++) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   348
    if (_A[i] ) {               // Found some bits
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   349
      if (bit != -1)
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   350
       return false;            // Already had bits, so fail
15614
3d9afca22dc7 8007402: Code cleanup to remove Parfait false positive
drchase
parents: 15241
diff changeset
   351
      bit = _A[i] & -_A[i];     // Extract low bit from mask
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   352
      int hi_bit = bit << (size-1); // high bit
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   353
      if (hi_bit != 0) {        // Bit set stays in same word?
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   354
        int set = hi_bit + ((hi_bit-1) & ~(bit-1));
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   355
        if (set != _A[i])
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   356
          return false;         // Require adjacent bit set and no more bits
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   357
      } else {                  // Else its a split-set case
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   358
        if (((-1) & ~(bit-1)) != _A[i])
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   359
          return false;         // Found many bits, so fail
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   360
        i++;                    // Skip iteration forward and check high part
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   361
        // The lower (32-size) bits should be 0 since it is split case.
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   362
        int clear_bit_size = 32-size;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   363
        int shift_back_size = 32-clear_bit_size;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   364
        int set = bit>>clear_bit_size;
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   365
        set = set & -set; // Remove sign extension.
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 25715
diff changeset
   366
        set = (((set << size) - 1) >> shift_back_size);
15614
3d9afca22dc7 8007402: Code cleanup to remove Parfait false positive
drchase
parents: 15241
diff changeset
   367
        if (i >= RM_SIZE || _A[i] != set)
3d9afca22dc7 8007402: Code cleanup to remove Parfait false positive
drchase
parents: 15241
diff changeset
   368
          return false; // Require expected low bits in next word
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   369
      }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   370
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   371
  }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   372
  // True for both the empty mask and for a bit set
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   373
  return true;
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   374
}
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 8921
diff changeset
   375
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   376
//------------------------------is_UP------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   377
// UP means register only, Register plus stack, or stack only is DOWN
489c9b5090e2 Initial load
duke
parents:
diff changeset
   378
bool RegMask::is_UP() const {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   379
  // Quick common case check for DOWN (any stack slot is legal)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   380
  if( is_AllStack() )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   381
    return false;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   382
  // Slower check for any stack bits set (also DOWN)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   383
  if( overlap(Matcher::STACK_ONLY_mask) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   384
    return false;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   385
  // Not DOWN, so must be UP
489c9b5090e2 Initial load
duke
parents:
diff changeset
   386
  return true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   387
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   388
489c9b5090e2 Initial load
duke
parents:
diff changeset
   389
//------------------------------Size-------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   390
// Compute size of register mask in bits
489c9b5090e2 Initial load
duke
parents:
diff changeset
   391
uint RegMask::Size() const {
38022
342a29d198d8 8149488: Incorrect declaration of bitsInByte in regmask.cpp.
rraghavan
parents: 31620
diff changeset
   392
  extern uint8_t bitsInByte[BITS_IN_BYTE_ARRAY_SIZE];
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   393
  uint sum = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   394
  for( int i = 0; i < RM_SIZE; i++ )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   395
    sum +=
489c9b5090e2 Initial load
duke
parents:
diff changeset
   396
      bitsInByte[(_A[i]>>24) & 0xff] +
489c9b5090e2 Initial load
duke
parents:
diff changeset
   397
      bitsInByte[(_A[i]>>16) & 0xff] +
489c9b5090e2 Initial load
duke
parents:
diff changeset
   398
      bitsInByte[(_A[i]>> 8) & 0xff] +
489c9b5090e2 Initial load
duke
parents:
diff changeset
   399
      bitsInByte[ _A[i]      & 0xff];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   400
  return sum;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   401
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   402
489c9b5090e2 Initial load
duke
parents:
diff changeset
   403
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   404
//------------------------------print------------------------------------------
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   405
void RegMask::dump(outputStream *st) const {
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   406
  st->print("[");
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   407
  RegMask rm = *this;           // Structure copy into local temp
489c9b5090e2 Initial load
duke
parents:
diff changeset
   408
489c9b5090e2 Initial load
duke
parents:
diff changeset
   409
  OptoReg::Name start = rm.find_first_elem(); // Get a register
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   410
  if (OptoReg::is_valid(start)) { // Check for empty mask
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   411
    rm.Remove(start);           // Yank from mask
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   412
    OptoReg::dump(start, st);   // Print register
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   413
    OptoReg::Name last = start;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   414
489c9b5090e2 Initial load
duke
parents:
diff changeset
   415
    // Now I have printed an initial register.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   416
    // Print adjacent registers as "rX-rZ" instead of "rX,rY,rZ".
489c9b5090e2 Initial load
duke
parents:
diff changeset
   417
    // Begin looping over the remaining registers.
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   418
    while (1) {                 //
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   419
      OptoReg::Name reg = rm.find_first_elem(); // Get a register
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   420
      if (!OptoReg::is_valid(reg))
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   421
        break;                  // Empty mask, end loop
489c9b5090e2 Initial load
duke
parents:
diff changeset
   422
      rm.Remove(reg);           // Yank from mask
489c9b5090e2 Initial load
duke
parents:
diff changeset
   423
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   424
      if (last+1 == reg) {      // See if they are adjacent
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   425
        // Adjacent registers just collect into long runs, no printing.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   426
        last = reg;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   427
      } else {                  // Ending some kind of run
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   428
        if (start == last) {    // 1-register run; no special printing
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   429
        } else if (start+1 == last) {
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   430
          st->print(",");       // 2-register run; print as "rX,rY"
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   431
          OptoReg::dump(last, st);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   432
        } else {                // Multi-register run; print as "rX-rZ"
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   433
          st->print("-");
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   434
          OptoReg::dump(last, st);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   435
        }
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   436
        st->print(",");         // Seperate start of new run
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   437
        start = last = reg;     // Start a new register run
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   438
        OptoReg::dump(start, st); // Print register
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   439
      } // End of if ending a register run or not
489c9b5090e2 Initial load
duke
parents:
diff changeset
   440
    } // End of while regmask not empty
489c9b5090e2 Initial load
duke
parents:
diff changeset
   441
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   442
    if (start == last) {        // 1-register run; no special printing
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   443
    } else if (start+1 == last) {
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   444
      st->print(",");           // 2-register run; print as "rX,rY"
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   445
      OptoReg::dump(last, st);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   446
    } else {                    // Multi-register run; print as "rX-rZ"
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   447
      st->print("-");
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   448
      OptoReg::dump(last, st);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   449
    }
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   450
    if (rm.is_AllStack()) st->print("...");
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   451
  }
15241
87d217c2d183 8005055: pass outputStream to more opto debug routines
kvn
parents: 13104
diff changeset
   452
  st->print("]");
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   453
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   454
#endif