hotspot/src/share/vm/opto/divnode.cpp
author kvn
Tue, 02 Nov 2010 09:00:37 -0700
changeset 7115 32300e243300
parent 5547 f4b087cbb361
child 7397 5b173b4ca846
permissions -rw-r--r--
6987135: Performance regression on Intel platform with 32-bits edition between 6u13 and 6u14. Summary: Use hardware DIV instruction for long division by constant when it is faster than code with multiply. Reviewed-by: never
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
     1
/*
7115
32300e243300 6987135: Performance regression on Intel platform with 32-bits edition between 6u13 and 6u14.
kvn
parents: 5547
diff changeset
     2
 * Copyright (c) 1997, 2010, Oracle and/or its affiliates. All rights reserved.
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
489c9b5090e2 Initial load
duke
parents:
diff changeset
     4
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
489c9b5090e2 Initial load
duke
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
489c9b5090e2 Initial load
duke
parents:
diff changeset
     7
 * published by the Free Software Foundation.
489c9b5090e2 Initial load
duke
parents:
diff changeset
     8
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
     9
 * This code is distributed in the hope that it will be useful, but WITHOUT
489c9b5090e2 Initial load
duke
parents:
diff changeset
    10
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
489c9b5090e2 Initial load
duke
parents:
diff changeset
    11
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
489c9b5090e2 Initial load
duke
parents:
diff changeset
    12
 * version 2 for more details (a copy is included in the LICENSE file that
489c9b5090e2 Initial load
duke
parents:
diff changeset
    13
 * accompanied this code).
489c9b5090e2 Initial load
duke
parents:
diff changeset
    14
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
    15
 * You should have received a copy of the GNU General Public License version
489c9b5090e2 Initial load
duke
parents:
diff changeset
    16
 * 2 along with this work; if not, write to the Free Software Foundation,
489c9b5090e2 Initial load
duke
parents:
diff changeset
    17
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
489c9b5090e2 Initial load
duke
parents:
diff changeset
    18
 *
5547
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 4583
diff changeset
    19
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 4583
diff changeset
    20
 * or visit www.oracle.com if you need additional information or have any
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 4583
diff changeset
    21
 * questions.
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    22
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
    23
 */
489c9b5090e2 Initial load
duke
parents:
diff changeset
    24
489c9b5090e2 Initial load
duke
parents:
diff changeset
    25
// Portions of code courtesy of Clifford Click
489c9b5090e2 Initial load
duke
parents:
diff changeset
    26
489c9b5090e2 Initial load
duke
parents:
diff changeset
    27
// Optimization - Graph Style
489c9b5090e2 Initial load
duke
parents:
diff changeset
    28
489c9b5090e2 Initial load
duke
parents:
diff changeset
    29
#include "incls/_precompiled.incl"
489c9b5090e2 Initial load
duke
parents:
diff changeset
    30
#include "incls/_divnode.cpp.incl"
489c9b5090e2 Initial load
duke
parents:
diff changeset
    31
#include <math.h>
489c9b5090e2 Initial load
duke
parents:
diff changeset
    32
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    33
//----------------------magic_int_divide_constants-----------------------------
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    34
// Compute magic multiplier and shift constant for converting a 32 bit divide
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    35
// by constant into a multiply/shift/add series. Return false if calculations
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    36
// fail.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    37
//
2131
98f9cef66a34 6810672: Comment typos
twisti
parents: 2032
diff changeset
    38
// Borrowed almost verbatim from Hacker's Delight by Henry S. Warren, Jr. with
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    39
// minor type name and parameter changes.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    40
static bool magic_int_divide_constants(jint d, jint &M, jint &s) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    41
  int32_t p;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    42
  uint32_t ad, anc, delta, q1, r1, q2, r2, t;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    43
  const uint32_t two31 = 0x80000000L;     // 2**31.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    44
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    45
  ad = ABS(d);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    46
  if (d == 0 || d == 1) return false;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    47
  t = two31 + ((uint32_t)d >> 31);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    48
  anc = t - 1 - t%ad;     // Absolute value of nc.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    49
  p = 31;                 // Init. p.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    50
  q1 = two31/anc;         // Init. q1 = 2**p/|nc|.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    51
  r1 = two31 - q1*anc;    // Init. r1 = rem(2**p, |nc|).
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    52
  q2 = two31/ad;          // Init. q2 = 2**p/|d|.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    53
  r2 = two31 - q2*ad;     // Init. r2 = rem(2**p, |d|).
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    54
  do {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    55
    p = p + 1;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    56
    q1 = 2*q1;            // Update q1 = 2**p/|nc|.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    57
    r1 = 2*r1;            // Update r1 = rem(2**p, |nc|).
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    58
    if (r1 >= anc) {      // (Must be an unsigned
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    59
      q1 = q1 + 1;        // comparison here).
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    60
      r1 = r1 - anc;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    61
    }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    62
    q2 = 2*q2;            // Update q2 = 2**p/|d|.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    63
    r2 = 2*r2;            // Update r2 = rem(2**p, |d|).
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    64
    if (r2 >= ad) {       // (Must be an unsigned
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    65
      q2 = q2 + 1;        // comparison here).
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    66
      r2 = r2 - ad;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    67
    }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    68
    delta = ad - r2;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    69
  } while (q1 < delta || (q1 == delta && r1 == 0));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    70
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    71
  M = q2 + 1;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    72
  if (d < 0) M = -M;      // Magic number and
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    73
  s = p - 32;             // shift amount to return.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    74
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    75
  return true;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    76
}
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    77
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    78
//--------------------------transform_int_divide-------------------------------
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    79
// Convert a division by constant divisor into an alternate Ideal graph.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    80
// Return NULL if no transformation occurs.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    81
static Node *transform_int_divide( PhaseGVN *phase, Node *dividend, jint divisor ) {
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    82
489c9b5090e2 Initial load
duke
parents:
diff changeset
    83
  // Check for invalid divisors
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    84
  assert( divisor != 0 && divisor != min_jint,
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    85
          "bad divisor for transforming to long multiply" );
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    86
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    87
  bool d_pos = divisor >= 0;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    88
  jint d = d_pos ? divisor : -divisor;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    89
  const int N = 32;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    90
489c9b5090e2 Initial load
duke
parents:
diff changeset
    91
  // Result
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    92
  Node *q = NULL;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    93
489c9b5090e2 Initial load
duke
parents:
diff changeset
    94
  if (d == 1) {
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    95
    // division by +/- 1
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    96
    if (!d_pos) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
    97
      // Just negate the value
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    98
      q = new (phase->C, 3) SubINode(phase->intcon(0), dividend);
489c9b5090e2 Initial load
duke
parents:
diff changeset
    99
    }
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   100
  } else if ( is_power_of_2(d) ) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   101
    // division by +/- a power of 2
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   102
489c9b5090e2 Initial load
duke
parents:
diff changeset
   103
    // See if we can simply do a shift without rounding
489c9b5090e2 Initial load
duke
parents:
diff changeset
   104
    bool needs_rounding = true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   105
    const Type *dt = phase->type(dividend);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   106
    const TypeInt *dti = dt->isa_int();
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   107
    if (dti && dti->_lo >= 0) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   108
      // we don't need to round a positive dividend
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   109
      needs_rounding = false;
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   110
    } else if( dividend->Opcode() == Op_AndI ) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   111
      // An AND mask of sufficient size clears the low bits and
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   112
      // I can avoid rounding.
1432
44f076e3d2a4 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 1067
diff changeset
   113
      const TypeInt *andconi_t = phase->type( dividend->in(2) )->isa_int();
44f076e3d2a4 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 1067
diff changeset
   114
      if( andconi_t && andconi_t->is_con() ) {
44f076e3d2a4 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 1067
diff changeset
   115
        jint andconi = andconi_t->get_con();
44f076e3d2a4 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 1067
diff changeset
   116
        if( andconi < 0 && is_power_of_2(-andconi) && (-andconi) >= d ) {
4583
b36d52bd2d19 6910484: incorrect integer optimization (loosing and op-r in a given example)
kvn
parents: 2746
diff changeset
   117
          if( (-andconi) == d ) // Remove AND if it clears bits which will be shifted
b36d52bd2d19 6910484: incorrect integer optimization (loosing and op-r in a given example)
kvn
parents: 2746
diff changeset
   118
            dividend = dividend->in(1);
1432
44f076e3d2a4 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 1067
diff changeset
   119
          needs_rounding = false;
44f076e3d2a4 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 1067
diff changeset
   120
        }
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   121
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   122
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   123
489c9b5090e2 Initial load
duke
parents:
diff changeset
   124
    // Add rounding to the shift to handle the sign bit
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   125
    int l = log2_intptr(d-1)+1;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   126
    if (needs_rounding) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   127
      // Divide-by-power-of-2 can be made into a shift, but you have to do
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   128
      // more math for the rounding.  You need to add 0 for positive
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   129
      // numbers, and "i-1" for negative numbers.  Example: i=4, so the
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   130
      // shift is by 2.  You need to add 3 to negative dividends and 0 to
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   131
      // positive ones.  So (-7+3)>>2 becomes -1, (-4+3)>>2 becomes -1,
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   132
      // (-2+3)>>2 becomes 0, etc.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   133
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   134
      // Compute 0 or -1, based on sign bit
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   135
      Node *sign = phase->transform(new (phase->C, 3) RShiftINode(dividend, phase->intcon(N - 1)));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   136
      // Mask sign bit to the low sign bits
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   137
      Node *round = phase->transform(new (phase->C, 3) URShiftINode(sign, phase->intcon(N - l)));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   138
      // Round up before shifting
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   139
      dividend = phase->transform(new (phase->C, 3) AddINode(dividend, round));
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   140
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   141
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   142
    // Shift for division
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   143
    q = new (phase->C, 3) RShiftINode(dividend, phase->intcon(l));
489c9b5090e2 Initial load
duke
parents:
diff changeset
   144
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   145
    if (!d_pos) {
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   146
      q = new (phase->C, 3) SubINode(phase->intcon(0), phase->transform(q));
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   147
    }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   148
  } else {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   149
    // Attempt the jint constant divide -> multiply transform found in
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   150
    //   "Division by Invariant Integers using Multiplication"
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   151
    //     by Granlund and Montgomery
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   152
    // See also "Hacker's Delight", chapter 10 by Warren.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   153
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   154
    jint magic_const;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   155
    jint shift_const;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   156
    if (magic_int_divide_constants(d, magic_const, shift_const)) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   157
      Node *magic = phase->longcon(magic_const);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   158
      Node *dividend_long = phase->transform(new (phase->C, 2) ConvI2LNode(dividend));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   159
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   160
      // Compute the high half of the dividend x magic multiplication
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   161
      Node *mul_hi = phase->transform(new (phase->C, 3) MulLNode(dividend_long, magic));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   162
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   163
      if (magic_const < 0) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   164
        mul_hi = phase->transform(new (phase->C, 3) RShiftLNode(mul_hi, phase->intcon(N)));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   165
        mul_hi = phase->transform(new (phase->C, 2) ConvL2INode(mul_hi));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   166
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   167
        // The magic multiplier is too large for a 32 bit constant. We've adjusted
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   168
        // it down by 2^32, but have to add 1 dividend back in after the multiplication.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   169
        // This handles the "overflow" case described by Granlund and Montgomery.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   170
        mul_hi = phase->transform(new (phase->C, 3) AddINode(dividend, mul_hi));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   171
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   172
        // Shift over the (adjusted) mulhi
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   173
        if (shift_const != 0) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   174
          mul_hi = phase->transform(new (phase->C, 3) RShiftINode(mul_hi, phase->intcon(shift_const)));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   175
        }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   176
      } else {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   177
        // No add is required, we can merge the shifts together.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   178
        mul_hi = phase->transform(new (phase->C, 3) RShiftLNode(mul_hi, phase->intcon(N + shift_const)));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   179
        mul_hi = phase->transform(new (phase->C, 2) ConvL2INode(mul_hi));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   180
      }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   181
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   182
      // Get a 0 or -1 from the sign of the dividend.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   183
      Node *addend0 = mul_hi;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   184
      Node *addend1 = phase->transform(new (phase->C, 3) RShiftINode(dividend, phase->intcon(N-1)));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   185
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   186
      // If the divisor is negative, swap the order of the input addends;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   187
      // this has the effect of negating the quotient.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   188
      if (!d_pos) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   189
        Node *temp = addend0; addend0 = addend1; addend1 = temp;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   190
      }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   191
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   192
      // Adjust the final quotient by subtracting -1 (adding 1)
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   193
      // from the mul_hi.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   194
      q = new (phase->C, 3) SubINode(addend0, addend1);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   195
    }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   196
  }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   197
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   198
  return q;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   199
}
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   200
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   201
//---------------------magic_long_divide_constants-----------------------------
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   202
// Compute magic multiplier and shift constant for converting a 64 bit divide
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   203
// by constant into a multiply/shift/add series. Return false if calculations
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   204
// fail.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   205
//
2131
98f9cef66a34 6810672: Comment typos
twisti
parents: 2032
diff changeset
   206
// Borrowed almost verbatim from Hacker's Delight by Henry S. Warren, Jr. with
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   207
// minor type name and parameter changes.  Adjusted to 64 bit word width.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   208
static bool magic_long_divide_constants(jlong d, jlong &M, jint &s) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   209
  int64_t p;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   210
  uint64_t ad, anc, delta, q1, r1, q2, r2, t;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   211
  const uint64_t two63 = 0x8000000000000000LL;     // 2**63.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   212
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   213
  ad = ABS(d);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   214
  if (d == 0 || d == 1) return false;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   215
  t = two63 + ((uint64_t)d >> 63);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   216
  anc = t - 1 - t%ad;     // Absolute value of nc.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   217
  p = 63;                 // Init. p.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   218
  q1 = two63/anc;         // Init. q1 = 2**p/|nc|.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   219
  r1 = two63 - q1*anc;    // Init. r1 = rem(2**p, |nc|).
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   220
  q2 = two63/ad;          // Init. q2 = 2**p/|d|.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   221
  r2 = two63 - q2*ad;     // Init. r2 = rem(2**p, |d|).
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   222
  do {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   223
    p = p + 1;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   224
    q1 = 2*q1;            // Update q1 = 2**p/|nc|.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   225
    r1 = 2*r1;            // Update r1 = rem(2**p, |nc|).
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   226
    if (r1 >= anc) {      // (Must be an unsigned
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   227
      q1 = q1 + 1;        // comparison here).
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   228
      r1 = r1 - anc;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   229
    }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   230
    q2 = 2*q2;            // Update q2 = 2**p/|d|.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   231
    r2 = 2*r2;            // Update r2 = rem(2**p, |d|).
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   232
    if (r2 >= ad) {       // (Must be an unsigned
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   233
      q2 = q2 + 1;        // comparison here).
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   234
      r2 = r2 - ad;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   235
    }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   236
    delta = ad - r2;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   237
  } while (q1 < delta || (q1 == delta && r1 == 0));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   238
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   239
  M = q2 + 1;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   240
  if (d < 0) M = -M;      // Magic number and
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   241
  s = p - 64;             // shift amount to return.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   242
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   243
  return true;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   244
}
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   245
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   246
//---------------------long_by_long_mulhi--------------------------------------
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   247
// Generate ideal node graph for upper half of a 64 bit x 64 bit multiplication
2031
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   248
static Node* long_by_long_mulhi(PhaseGVN* phase, Node* dividend, jlong magic_const) {
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   249
  // If the architecture supports a 64x64 mulhi, there is
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   250
  // no need to synthesize it in ideal nodes.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   251
  if (Matcher::has_match_rule(Op_MulHiL)) {
2031
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   252
    Node* v = phase->longcon(magic_const);
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   253
    return new (phase->C, 3) MulHiLNode(dividend, v);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   254
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   255
2031
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   256
  // Taken from Hacker's Delight, Fig. 8-2. Multiply high signed.
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   257
  // (http://www.hackersdelight.org/HDcode/mulhs.c)
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   258
  //
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   259
  // int mulhs(int u, int v) {
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   260
  //    unsigned u0, v0, w0;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   261
  //    int u1, v1, w1, w2, t;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   262
  //
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   263
  //    u0 = u & 0xFFFF;  u1 = u >> 16;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   264
  //    v0 = v & 0xFFFF;  v1 = v >> 16;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   265
  //    w0 = u0*v0;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   266
  //    t  = u1*v0 + (w0 >> 16);
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   267
  //    w1 = t & 0xFFFF;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   268
  //    w2 = t >> 16;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   269
  //    w1 = u0*v1 + w1;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   270
  //    return u1*v1 + w2 + (w1 >> 16);
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   271
  // }
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   272
  //
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   273
  // Note: The version above is for 32x32 multiplications, while the
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   274
  // following inline comments are adapted to 64x64.
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   275
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   276
  const int N = 64;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   277
2031
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   278
  // u0 = u & 0xFFFFFFFF;  u1 = u >> 32;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   279
  Node* u0 = phase->transform(new (phase->C, 3) AndLNode(dividend, phase->longcon(0xFFFFFFFF)));
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   280
  Node* u1 = phase->transform(new (phase->C, 3) RShiftLNode(dividend, phase->intcon(N / 2)));
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   281
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   282
  // v0 = v & 0xFFFFFFFF;  v1 = v >> 32;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   283
  Node* v0 = phase->longcon(magic_const & 0xFFFFFFFF);
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   284
  Node* v1 = phase->longcon(magic_const >> (N / 2));
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   285
2031
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   286
  // w0 = u0*v0;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   287
  Node* w0 = phase->transform(new (phase->C, 3) MulLNode(u0, v0));
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   288
2031
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   289
  // t = u1*v0 + (w0 >> 32);
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   290
  Node* u1v0 = phase->transform(new (phase->C, 3) MulLNode(u1, v0));
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   291
  Node* temp = phase->transform(new (phase->C, 3) URShiftLNode(w0, phase->intcon(N / 2)));
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   292
  Node* t    = phase->transform(new (phase->C, 3) AddLNode(u1v0, temp));
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   293
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   294
  // w1 = t & 0xFFFFFFFF;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   295
  Node* w1 = new (phase->C, 3) AndLNode(t, phase->longcon(0xFFFFFFFF));
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   296
2031
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   297
  // w2 = t >> 32;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   298
  Node* w2 = new (phase->C, 3) RShiftLNode(t, phase->intcon(N / 2));
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   299
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   300
  // 6732154: Construct both w1 and w2 before transforming, so t
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   301
  // doesn't go dead prematurely.
2746
825bfb41920c 6837011: SIGSEGV in PhaseIdealLoop in 32bit jvm
twisti
parents: 2131
diff changeset
   302
  // 6837011: We need to transform w2 before w1 because the
825bfb41920c 6837011: SIGSEGV in PhaseIdealLoop in 32bit jvm
twisti
parents: 2131
diff changeset
   303
  // transformation of w1 could return t.
825bfb41920c 6837011: SIGSEGV in PhaseIdealLoop in 32bit jvm
twisti
parents: 2131
diff changeset
   304
  w2 = phase->transform(w2);
2031
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   305
  w1 = phase->transform(w1);
1056
da0241911ea8 6732154: REG: Printing an Image using image/gif doc flavor crashes the VM, Solsparc
rasbold
parents: 670
diff changeset
   306
2031
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   307
  // w1 = u0*v1 + w1;
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   308
  Node* u0v1 = phase->transform(new (phase->C, 3) MulLNode(u0, v1));
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   309
  w1         = phase->transform(new (phase->C, 3) AddLNode(u0v1, w1));
1056
da0241911ea8 6732154: REG: Printing an Image using image/gif doc flavor crashes the VM, Solsparc
rasbold
parents: 670
diff changeset
   310
2031
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   311
  // return u1*v1 + w2 + (w1 >> 32);
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   312
  Node* u1v1  = phase->transform(new (phase->C, 3) MulLNode(u1, v1));
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   313
  Node* temp1 = phase->transform(new (phase->C, 3) AddLNode(u1v1, w2));
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   314
  Node* temp2 = phase->transform(new (phase->C, 3) RShiftLNode(w1, phase->intcon(N / 2)));
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   315
2031
24e034f56dcb 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 1436
diff changeset
   316
  return new (phase->C, 3) AddLNode(temp1, temp2);
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   317
}
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   318
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   319
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   320
//--------------------------transform_long_divide------------------------------
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   321
// Convert a division by constant divisor into an alternate Ideal graph.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   322
// Return NULL if no transformation occurs.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   323
static Node *transform_long_divide( PhaseGVN *phase, Node *dividend, jlong divisor ) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   324
  // Check for invalid divisors
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   325
  assert( divisor != 0L && divisor != min_jlong,
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   326
          "bad divisor for transforming to long multiply" );
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   327
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   328
  bool d_pos = divisor >= 0;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   329
  jlong d = d_pos ? divisor : -divisor;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   330
  const int N = 64;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   331
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   332
  // Result
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   333
  Node *q = NULL;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   334
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   335
  if (d == 1) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   336
    // division by +/- 1
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   337
    if (!d_pos) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   338
      // Just negate the value
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   339
      q = new (phase->C, 3) SubLNode(phase->longcon(0), dividend);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   340
    }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   341
  } else if ( is_power_of_2_long(d) ) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   342
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   343
    // division by +/- a power of 2
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   344
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   345
    // See if we can simply do a shift without rounding
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   346
    bool needs_rounding = true;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   347
    const Type *dt = phase->type(dividend);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   348
    const TypeLong *dtl = dt->isa_long();
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   349
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   350
    if (dtl && dtl->_lo > 0) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   351
      // we don't need to round a positive dividend
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   352
      needs_rounding = false;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   353
    } else if( dividend->Opcode() == Op_AndL ) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   354
      // An AND mask of sufficient size clears the low bits and
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   355
      // I can avoid rounding.
1432
44f076e3d2a4 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 1067
diff changeset
   356
      const TypeLong *andconl_t = phase->type( dividend->in(2) )->isa_long();
44f076e3d2a4 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 1067
diff changeset
   357
      if( andconl_t && andconl_t->is_con() ) {
44f076e3d2a4 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 1067
diff changeset
   358
        jlong andconl = andconl_t->get_con();
44f076e3d2a4 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 1067
diff changeset
   359
        if( andconl < 0 && is_power_of_2_long(-andconl) && (-andconl) >= d ) {
4583
b36d52bd2d19 6910484: incorrect integer optimization (loosing and op-r in a given example)
kvn
parents: 2746
diff changeset
   360
          if( (-andconl) == d ) // Remove AND if it clears bits which will be shifted
b36d52bd2d19 6910484: incorrect integer optimization (loosing and op-r in a given example)
kvn
parents: 2746
diff changeset
   361
            dividend = dividend->in(1);
1432
44f076e3d2a4 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 1067
diff changeset
   362
          needs_rounding = false;
44f076e3d2a4 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 1067
diff changeset
   363
        }
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   364
      }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   365
    }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   366
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   367
    // Add rounding to the shift to handle the sign bit
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   368
    int l = log2_long(d-1)+1;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   369
    if (needs_rounding) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   370
      // Divide-by-power-of-2 can be made into a shift, but you have to do
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   371
      // more math for the rounding.  You need to add 0 for positive
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   372
      // numbers, and "i-1" for negative numbers.  Example: i=4, so the
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   373
      // shift is by 2.  You need to add 3 to negative dividends and 0 to
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   374
      // positive ones.  So (-7+3)>>2 becomes -1, (-4+3)>>2 becomes -1,
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   375
      // (-2+3)>>2 becomes 0, etc.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   376
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   377
      // Compute 0 or -1, based on sign bit
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   378
      Node *sign = phase->transform(new (phase->C, 3) RShiftLNode(dividend, phase->intcon(N - 1)));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   379
      // Mask sign bit to the low sign bits
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   380
      Node *round = phase->transform(new (phase->C, 3) URShiftLNode(sign, phase->intcon(N - l)));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   381
      // Round up before shifting
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   382
      dividend = phase->transform(new (phase->C, 3) AddLNode(dividend, round));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   383
    }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   384
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   385
    // Shift for division
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   386
    q = new (phase->C, 3) RShiftLNode(dividend, phase->intcon(l));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   387
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   388
    if (!d_pos) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   389
      q = new (phase->C, 3) SubLNode(phase->longcon(0), phase->transform(q));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   390
    }
7115
32300e243300 6987135: Performance regression on Intel platform with 32-bits edition between 6u13 and 6u14.
kvn
parents: 5547
diff changeset
   391
  } else if ( !Matcher::use_asm_for_ldiv_by_con(d) ) { // Use hardware DIV instruction when
32300e243300 6987135: Performance regression on Intel platform with 32-bits edition between 6u13 and 6u14.
kvn
parents: 5547
diff changeset
   392
                                                       // it is faster than code generated below.
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   393
    // Attempt the jlong constant divide -> multiply transform found in
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   394
    //   "Division by Invariant Integers using Multiplication"
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   395
    //     by Granlund and Montgomery
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   396
    // See also "Hacker's Delight", chapter 10 by Warren.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   397
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   398
    jlong magic_const;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   399
    jint shift_const;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   400
    if (magic_long_divide_constants(d, magic_const, shift_const)) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   401
      // Compute the high half of the dividend x magic multiplication
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   402
      Node *mul_hi = phase->transform(long_by_long_mulhi(phase, dividend, magic_const));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   403
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   404
      // The high half of the 128-bit multiply is computed.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   405
      if (magic_const < 0) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   406
        // The magic multiplier is too large for a 64 bit constant. We've adjusted
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   407
        // it down by 2^64, but have to add 1 dividend back in after the multiplication.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   408
        // This handles the "overflow" case described by Granlund and Montgomery.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   409
        mul_hi = phase->transform(new (phase->C, 3) AddLNode(dividend, mul_hi));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   410
      }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   411
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   412
      // Shift over the (adjusted) mulhi
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   413
      if (shift_const != 0) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   414
        mul_hi = phase->transform(new (phase->C, 3) RShiftLNode(mul_hi, phase->intcon(shift_const)));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   415
      }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   416
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   417
      // Get a 0 or -1 from the sign of the dividend.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   418
      Node *addend0 = mul_hi;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   419
      Node *addend1 = phase->transform(new (phase->C, 3) RShiftLNode(dividend, phase->intcon(N-1)));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   420
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   421
      // If the divisor is negative, swap the order of the input addends;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   422
      // this has the effect of negating the quotient.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   423
      if (!d_pos) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   424
        Node *temp = addend0; addend0 = addend1; addend1 = temp;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   425
      }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   426
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   427
      // Adjust the final quotient by subtracting -1 (adding 1)
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   428
      // from the mul_hi.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   429
      q = new (phase->C, 3) SubLNode(addend0, addend1);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   430
    }
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   431
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   432
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   433
  return q;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   434
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   435
489c9b5090e2 Initial load
duke
parents:
diff changeset
   436
//=============================================================================
489c9b5090e2 Initial load
duke
parents:
diff changeset
   437
//------------------------------Identity---------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   438
// If the divisor is 1, we are an identity on the dividend.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   439
Node *DivINode::Identity( PhaseTransform *phase ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   440
  return (phase->type( in(2) )->higher_equal(TypeInt::ONE)) ? in(1) : this;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   441
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   442
489c9b5090e2 Initial load
duke
parents:
diff changeset
   443
//------------------------------Idealize---------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   444
// Divides can be changed to multiplies and/or shifts
489c9b5090e2 Initial load
duke
parents:
diff changeset
   445
Node *DivINode::Ideal(PhaseGVN *phase, bool can_reshape) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   446
  if (in(0) && remove_dead_region(phase, can_reshape))  return this;
1067
f82e0a8cd438 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 1056
diff changeset
   447
  // Don't bother trying to transform a dead node
f82e0a8cd438 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 1056
diff changeset
   448
  if( in(0) && in(0)->is_top() )  return NULL;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   449
489c9b5090e2 Initial load
duke
parents:
diff changeset
   450
  const Type *t = phase->type( in(2) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   451
  if( t == TypeInt::ONE )       // Identity?
489c9b5090e2 Initial load
duke
parents:
diff changeset
   452
    return NULL;                // Skip it
489c9b5090e2 Initial load
duke
parents:
diff changeset
   453
489c9b5090e2 Initial load
duke
parents:
diff changeset
   454
  const TypeInt *ti = t->isa_int();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   455
  if( !ti ) return NULL;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   456
  if( !ti->is_con() ) return NULL;
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   457
  jint i = ti->get_con();       // Get divisor
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   458
489c9b5090e2 Initial load
duke
parents:
diff changeset
   459
  if (i == 0) return NULL;      // Dividing by zero constant does not idealize
489c9b5090e2 Initial load
duke
parents:
diff changeset
   460
489c9b5090e2 Initial load
duke
parents:
diff changeset
   461
  set_req(0,NULL);              // Dividing by a not-zero constant; no faulting
489c9b5090e2 Initial load
duke
parents:
diff changeset
   462
489c9b5090e2 Initial load
duke
parents:
diff changeset
   463
  // Dividing by MININT does not optimize as a power-of-2 shift.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   464
  if( i == min_jint ) return NULL;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   465
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   466
  return transform_int_divide( phase, in(1), i );
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   467
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   468
489c9b5090e2 Initial load
duke
parents:
diff changeset
   469
//------------------------------Value------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   470
// A DivINode divides its inputs.  The third input is a Control input, used to
489c9b5090e2 Initial load
duke
parents:
diff changeset
   471
// prevent hoisting the divide above an unsafe test.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   472
const Type *DivINode::Value( PhaseTransform *phase ) const {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   473
  // Either input is TOP ==> the result is TOP
489c9b5090e2 Initial load
duke
parents:
diff changeset
   474
  const Type *t1 = phase->type( in(1) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   475
  const Type *t2 = phase->type( in(2) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   476
  if( t1 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   477
  if( t2 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   478
489c9b5090e2 Initial load
duke
parents:
diff changeset
   479
  // x/x == 1 since we always generate the dynamic divisor check for 0.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   480
  if( phase->eqv( in(1), in(2) ) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   481
    return TypeInt::ONE;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   482
489c9b5090e2 Initial load
duke
parents:
diff changeset
   483
  // Either input is BOTTOM ==> the result is the local BOTTOM
489c9b5090e2 Initial load
duke
parents:
diff changeset
   484
  const Type *bot = bottom_type();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   485
  if( (t1 == bot) || (t2 == bot) ||
489c9b5090e2 Initial load
duke
parents:
diff changeset
   486
      (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   487
    return bot;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   488
489c9b5090e2 Initial load
duke
parents:
diff changeset
   489
  // Divide the two numbers.  We approximate.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   490
  // If divisor is a constant and not zero
489c9b5090e2 Initial load
duke
parents:
diff changeset
   491
  const TypeInt *i1 = t1->is_int();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   492
  const TypeInt *i2 = t2->is_int();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   493
  int widen = MAX2(i1->_widen, i2->_widen);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   494
489c9b5090e2 Initial load
duke
parents:
diff changeset
   495
  if( i2->is_con() && i2->get_con() != 0 ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   496
    int32 d = i2->get_con(); // Divisor
489c9b5090e2 Initial load
duke
parents:
diff changeset
   497
    jint lo, hi;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   498
    if( d >= 0 ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   499
      lo = i1->_lo/d;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   500
      hi = i1->_hi/d;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   501
    } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   502
      if( d == -1 && i1->_lo == min_jint ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   503
        // 'min_jint/-1' throws arithmetic exception during compilation
489c9b5090e2 Initial load
duke
parents:
diff changeset
   504
        lo = min_jint;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   505
        // do not support holes, 'hi' must go to either min_jint or max_jint:
489c9b5090e2 Initial load
duke
parents:
diff changeset
   506
        // [min_jint, -10]/[-1,-1] ==> [min_jint] UNION [10,max_jint]
489c9b5090e2 Initial load
duke
parents:
diff changeset
   507
        hi = i1->_hi == min_jint ? min_jint : max_jint;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   508
      } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   509
        lo = i1->_hi/d;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   510
        hi = i1->_lo/d;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   511
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   512
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   513
    return TypeInt::make(lo, hi, widen);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   514
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   515
489c9b5090e2 Initial load
duke
parents:
diff changeset
   516
  // If the dividend is a constant
489c9b5090e2 Initial load
duke
parents:
diff changeset
   517
  if( i1->is_con() ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   518
    int32 d = i1->get_con();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   519
    if( d < 0 ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   520
      if( d == min_jint ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   521
        //  (-min_jint) == min_jint == (min_jint / -1)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   522
        return TypeInt::make(min_jint, max_jint/2 + 1, widen);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   523
      } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   524
        return TypeInt::make(d, -d, widen);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   525
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   526
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   527
    return TypeInt::make(-d, d, widen);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   528
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   529
489c9b5090e2 Initial load
duke
parents:
diff changeset
   530
  // Otherwise we give up all hope
489c9b5090e2 Initial load
duke
parents:
diff changeset
   531
  return TypeInt::INT;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   532
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   533
489c9b5090e2 Initial load
duke
parents:
diff changeset
   534
489c9b5090e2 Initial load
duke
parents:
diff changeset
   535
//=============================================================================
489c9b5090e2 Initial load
duke
parents:
diff changeset
   536
//------------------------------Identity---------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   537
// If the divisor is 1, we are an identity on the dividend.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   538
Node *DivLNode::Identity( PhaseTransform *phase ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   539
  return (phase->type( in(2) )->higher_equal(TypeLong::ONE)) ? in(1) : this;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   540
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   541
489c9b5090e2 Initial load
duke
parents:
diff changeset
   542
//------------------------------Idealize---------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   543
// Dividing by a power of 2 is a shift.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   544
Node *DivLNode::Ideal( PhaseGVN *phase, bool can_reshape) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   545
  if (in(0) && remove_dead_region(phase, can_reshape))  return this;
1067
f82e0a8cd438 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 1056
diff changeset
   546
  // Don't bother trying to transform a dead node
f82e0a8cd438 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 1056
diff changeset
   547
  if( in(0) && in(0)->is_top() )  return NULL;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   548
489c9b5090e2 Initial load
duke
parents:
diff changeset
   549
  const Type *t = phase->type( in(2) );
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   550
  if( t == TypeLong::ONE )      // Identity?
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   551
    return NULL;                // Skip it
489c9b5090e2 Initial load
duke
parents:
diff changeset
   552
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   553
  const TypeLong *tl = t->isa_long();
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   554
  if( !tl ) return NULL;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   555
  if( !tl->is_con() ) return NULL;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   556
  jlong l = tl->get_con();      // Get divisor
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   557
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   558
  if (l == 0) return NULL;      // Dividing by zero constant does not idealize
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   559
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   560
  set_req(0,NULL);              // Dividing by a not-zero constant; no faulting
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   561
7115
32300e243300 6987135: Performance regression on Intel platform with 32-bits edition between 6u13 and 6u14.
kvn
parents: 5547
diff changeset
   562
  // Dividing by MINLONG does not optimize as a power-of-2 shift.
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   563
  if( l == min_jlong ) return NULL;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   564
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   565
  return transform_long_divide( phase, in(1), l );
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   566
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   567
489c9b5090e2 Initial load
duke
parents:
diff changeset
   568
//------------------------------Value------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   569
// A DivLNode divides its inputs.  The third input is a Control input, used to
489c9b5090e2 Initial load
duke
parents:
diff changeset
   570
// prevent hoisting the divide above an unsafe test.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   571
const Type *DivLNode::Value( PhaseTransform *phase ) const {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   572
  // Either input is TOP ==> the result is TOP
489c9b5090e2 Initial load
duke
parents:
diff changeset
   573
  const Type *t1 = phase->type( in(1) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   574
  const Type *t2 = phase->type( in(2) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   575
  if( t1 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   576
  if( t2 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   577
489c9b5090e2 Initial load
duke
parents:
diff changeset
   578
  // x/x == 1 since we always generate the dynamic divisor check for 0.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   579
  if( phase->eqv( in(1), in(2) ) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   580
    return TypeLong::ONE;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   581
489c9b5090e2 Initial load
duke
parents:
diff changeset
   582
  // Either input is BOTTOM ==> the result is the local BOTTOM
489c9b5090e2 Initial load
duke
parents:
diff changeset
   583
  const Type *bot = bottom_type();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   584
  if( (t1 == bot) || (t2 == bot) ||
489c9b5090e2 Initial load
duke
parents:
diff changeset
   585
      (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   586
    return bot;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   587
489c9b5090e2 Initial load
duke
parents:
diff changeset
   588
  // Divide the two numbers.  We approximate.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   589
  // If divisor is a constant and not zero
489c9b5090e2 Initial load
duke
parents:
diff changeset
   590
  const TypeLong *i1 = t1->is_long();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   591
  const TypeLong *i2 = t2->is_long();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   592
  int widen = MAX2(i1->_widen, i2->_widen);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   593
489c9b5090e2 Initial load
duke
parents:
diff changeset
   594
  if( i2->is_con() && i2->get_con() != 0 ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   595
    jlong d = i2->get_con();    // Divisor
489c9b5090e2 Initial load
duke
parents:
diff changeset
   596
    jlong lo, hi;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   597
    if( d >= 0 ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   598
      lo = i1->_lo/d;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   599
      hi = i1->_hi/d;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   600
    } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   601
      if( d == CONST64(-1) && i1->_lo == min_jlong ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   602
        // 'min_jlong/-1' throws arithmetic exception during compilation
489c9b5090e2 Initial load
duke
parents:
diff changeset
   603
        lo = min_jlong;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   604
        // do not support holes, 'hi' must go to either min_jlong or max_jlong:
489c9b5090e2 Initial load
duke
parents:
diff changeset
   605
        // [min_jlong, -10]/[-1,-1] ==> [min_jlong] UNION [10,max_jlong]
489c9b5090e2 Initial load
duke
parents:
diff changeset
   606
        hi = i1->_hi == min_jlong ? min_jlong : max_jlong;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   607
      } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   608
        lo = i1->_hi/d;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   609
        hi = i1->_lo/d;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   610
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   611
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   612
    return TypeLong::make(lo, hi, widen);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   613
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   614
489c9b5090e2 Initial load
duke
parents:
diff changeset
   615
  // If the dividend is a constant
489c9b5090e2 Initial load
duke
parents:
diff changeset
   616
  if( i1->is_con() ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   617
    jlong d = i1->get_con();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   618
    if( d < 0 ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   619
      if( d == min_jlong ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   620
        //  (-min_jlong) == min_jlong == (min_jlong / -1)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   621
        return TypeLong::make(min_jlong, max_jlong/2 + 1, widen);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   622
      } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   623
        return TypeLong::make(d, -d, widen);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   624
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   625
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   626
    return TypeLong::make(-d, d, widen);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   627
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   628
489c9b5090e2 Initial load
duke
parents:
diff changeset
   629
  // Otherwise we give up all hope
489c9b5090e2 Initial load
duke
parents:
diff changeset
   630
  return TypeLong::LONG;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   631
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   632
489c9b5090e2 Initial load
duke
parents:
diff changeset
   633
489c9b5090e2 Initial load
duke
parents:
diff changeset
   634
//=============================================================================
489c9b5090e2 Initial load
duke
parents:
diff changeset
   635
//------------------------------Value------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   636
// An DivFNode divides its inputs.  The third input is a Control input, used to
489c9b5090e2 Initial load
duke
parents:
diff changeset
   637
// prevent hoisting the divide above an unsafe test.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   638
const Type *DivFNode::Value( PhaseTransform *phase ) const {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   639
  // Either input is TOP ==> the result is TOP
489c9b5090e2 Initial load
duke
parents:
diff changeset
   640
  const Type *t1 = phase->type( in(1) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   641
  const Type *t2 = phase->type( in(2) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   642
  if( t1 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   643
  if( t2 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   644
489c9b5090e2 Initial load
duke
parents:
diff changeset
   645
  // Either input is BOTTOM ==> the result is the local BOTTOM
489c9b5090e2 Initial load
duke
parents:
diff changeset
   646
  const Type *bot = bottom_type();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   647
  if( (t1 == bot) || (t2 == bot) ||
489c9b5090e2 Initial load
duke
parents:
diff changeset
   648
      (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   649
    return bot;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   650
489c9b5090e2 Initial load
duke
parents:
diff changeset
   651
  // x/x == 1, we ignore 0/0.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   652
  // Note: if t1 and t2 are zero then result is NaN (JVMS page 213)
378
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
   653
  // Does not work for variables because of NaN's
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   654
  if( phase->eqv( in(1), in(2) ) && t1->base() == Type::FloatCon)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   655
    if (!g_isnan(t1->getf()) && g_isfinite(t1->getf()) && t1->getf() != 0.0) // could be negative ZERO or NaN
489c9b5090e2 Initial load
duke
parents:
diff changeset
   656
      return TypeF::ONE;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   657
489c9b5090e2 Initial load
duke
parents:
diff changeset
   658
  if( t2 == TypeF::ONE )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   659
    return t1;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   660
489c9b5090e2 Initial load
duke
parents:
diff changeset
   661
  // If divisor is a constant and not zero, divide them numbers
489c9b5090e2 Initial load
duke
parents:
diff changeset
   662
  if( t1->base() == Type::FloatCon &&
489c9b5090e2 Initial load
duke
parents:
diff changeset
   663
      t2->base() == Type::FloatCon &&
489c9b5090e2 Initial load
duke
parents:
diff changeset
   664
      t2->getf() != 0.0 ) // could be negative zero
489c9b5090e2 Initial load
duke
parents:
diff changeset
   665
    return TypeF::make( t1->getf()/t2->getf() );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   666
489c9b5090e2 Initial load
duke
parents:
diff changeset
   667
  // If the dividend is a constant zero
489c9b5090e2 Initial load
duke
parents:
diff changeset
   668
  // Note: if t1 and t2 are zero then result is NaN (JVMS page 213)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   669
  // Test TypeF::ZERO is not sufficient as it could be negative zero
489c9b5090e2 Initial load
duke
parents:
diff changeset
   670
489c9b5090e2 Initial load
duke
parents:
diff changeset
   671
  if( t1 == TypeF::ZERO && !g_isnan(t2->getf()) && t2->getf() != 0.0 )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   672
    return TypeF::ZERO;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   673
489c9b5090e2 Initial load
duke
parents:
diff changeset
   674
  // Otherwise we give up all hope
489c9b5090e2 Initial load
duke
parents:
diff changeset
   675
  return Type::FLOAT;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   676
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   677
489c9b5090e2 Initial load
duke
parents:
diff changeset
   678
//------------------------------isA_Copy---------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   679
// Dividing by self is 1.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   680
// If the divisor is 1, we are an identity on the dividend.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   681
Node *DivFNode::Identity( PhaseTransform *phase ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   682
  return (phase->type( in(2) ) == TypeF::ONE) ? in(1) : this;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   683
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   684
489c9b5090e2 Initial load
duke
parents:
diff changeset
   685
489c9b5090e2 Initial load
duke
parents:
diff changeset
   686
//------------------------------Idealize---------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   687
Node *DivFNode::Ideal(PhaseGVN *phase, bool can_reshape) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   688
  if (in(0) && remove_dead_region(phase, can_reshape))  return this;
1067
f82e0a8cd438 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 1056
diff changeset
   689
  // Don't bother trying to transform a dead node
f82e0a8cd438 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 1056
diff changeset
   690
  if( in(0) && in(0)->is_top() )  return NULL;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   691
489c9b5090e2 Initial load
duke
parents:
diff changeset
   692
  const Type *t2 = phase->type( in(2) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   693
  if( t2 == TypeF::ONE )         // Identity?
489c9b5090e2 Initial load
duke
parents:
diff changeset
   694
    return NULL;                // Skip it
489c9b5090e2 Initial load
duke
parents:
diff changeset
   695
489c9b5090e2 Initial load
duke
parents:
diff changeset
   696
  const TypeF *tf = t2->isa_float_constant();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   697
  if( !tf ) return NULL;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   698
  if( tf->base() != Type::FloatCon ) return NULL;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   699
489c9b5090e2 Initial load
duke
parents:
diff changeset
   700
  // Check for out of range values
489c9b5090e2 Initial load
duke
parents:
diff changeset
   701
  if( tf->is_nan() || !tf->is_finite() ) return NULL;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   702
489c9b5090e2 Initial load
duke
parents:
diff changeset
   703
  // Get the value
489c9b5090e2 Initial load
duke
parents:
diff changeset
   704
  float f = tf->getf();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   705
  int exp;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   706
489c9b5090e2 Initial load
duke
parents:
diff changeset
   707
  // Only for special case of dividing by a power of 2
489c9b5090e2 Initial load
duke
parents:
diff changeset
   708
  if( frexp((double)f, &exp) != 0.5 ) return NULL;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   709
489c9b5090e2 Initial load
duke
parents:
diff changeset
   710
  // Limit the range of acceptable exponents
489c9b5090e2 Initial load
duke
parents:
diff changeset
   711
  if( exp < -126 || exp > 126 ) return NULL;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   712
489c9b5090e2 Initial load
duke
parents:
diff changeset
   713
  // Compute the reciprocal
489c9b5090e2 Initial load
duke
parents:
diff changeset
   714
  float reciprocal = ((float)1.0) / f;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   715
489c9b5090e2 Initial load
duke
parents:
diff changeset
   716
  assert( frexp((double)reciprocal, &exp) == 0.5, "reciprocal should be power of 2" );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   717
489c9b5090e2 Initial load
duke
parents:
diff changeset
   718
  // return multiplication by the reciprocal
489c9b5090e2 Initial load
duke
parents:
diff changeset
   719
  return (new (phase->C, 3) MulFNode(in(1), phase->makecon(TypeF::make(reciprocal))));
489c9b5090e2 Initial load
duke
parents:
diff changeset
   720
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   721
489c9b5090e2 Initial load
duke
parents:
diff changeset
   722
//=============================================================================
489c9b5090e2 Initial load
duke
parents:
diff changeset
   723
//------------------------------Value------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   724
// An DivDNode divides its inputs.  The third input is a Control input, used to
378
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
   725
// prevent hoisting the divide above an unsafe test.
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   726
const Type *DivDNode::Value( PhaseTransform *phase ) const {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   727
  // Either input is TOP ==> the result is TOP
489c9b5090e2 Initial load
duke
parents:
diff changeset
   728
  const Type *t1 = phase->type( in(1) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   729
  const Type *t2 = phase->type( in(2) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   730
  if( t1 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   731
  if( t2 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   732
489c9b5090e2 Initial load
duke
parents:
diff changeset
   733
  // Either input is BOTTOM ==> the result is the local BOTTOM
489c9b5090e2 Initial load
duke
parents:
diff changeset
   734
  const Type *bot = bottom_type();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   735
  if( (t1 == bot) || (t2 == bot) ||
489c9b5090e2 Initial load
duke
parents:
diff changeset
   736
      (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   737
    return bot;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   738
489c9b5090e2 Initial load
duke
parents:
diff changeset
   739
  // x/x == 1, we ignore 0/0.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   740
  // Note: if t1 and t2 are zero then result is NaN (JVMS page 213)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   741
  // Does not work for variables because of NaN's
489c9b5090e2 Initial load
duke
parents:
diff changeset
   742
  if( phase->eqv( in(1), in(2) ) && t1->base() == Type::DoubleCon)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   743
    if (!g_isnan(t1->getd()) && g_isfinite(t1->getd()) && t1->getd() != 0.0) // could be negative ZERO or NaN
489c9b5090e2 Initial load
duke
parents:
diff changeset
   744
      return TypeD::ONE;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   745
489c9b5090e2 Initial load
duke
parents:
diff changeset
   746
  if( t2 == TypeD::ONE )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   747
    return t1;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   748
1436
6869d58f4f58 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 1432
diff changeset
   749
#if defined(IA32)
6869d58f4f58 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 1432
diff changeset
   750
  if (!phase->C->method()->is_strict())
6869d58f4f58 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 1432
diff changeset
   751
    // Can't trust native compilers to properly fold strict double
6869d58f4f58 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 1432
diff changeset
   752
    // division with round-to-zero on this platform.
6869d58f4f58 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 1432
diff changeset
   753
#endif
6869d58f4f58 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 1432
diff changeset
   754
    {
6869d58f4f58 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 1432
diff changeset
   755
      // If divisor is a constant and not zero, divide them numbers
6869d58f4f58 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 1432
diff changeset
   756
      if( t1->base() == Type::DoubleCon &&
6869d58f4f58 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 1432
diff changeset
   757
          t2->base() == Type::DoubleCon &&
6869d58f4f58 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 1432
diff changeset
   758
          t2->getd() != 0.0 ) // could be negative zero
6869d58f4f58 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 1432
diff changeset
   759
        return TypeD::make( t1->getd()/t2->getd() );
6869d58f4f58 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 1432
diff changeset
   760
    }
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   761
489c9b5090e2 Initial load
duke
parents:
diff changeset
   762
  // If the dividend is a constant zero
489c9b5090e2 Initial load
duke
parents:
diff changeset
   763
  // Note: if t1 and t2 are zero then result is NaN (JVMS page 213)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   764
  // Test TypeF::ZERO is not sufficient as it could be negative zero
489c9b5090e2 Initial load
duke
parents:
diff changeset
   765
  if( t1 == TypeD::ZERO && !g_isnan(t2->getd()) && t2->getd() != 0.0 )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   766
    return TypeD::ZERO;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   767
489c9b5090e2 Initial load
duke
parents:
diff changeset
   768
  // Otherwise we give up all hope
489c9b5090e2 Initial load
duke
parents:
diff changeset
   769
  return Type::DOUBLE;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   770
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   771
489c9b5090e2 Initial load
duke
parents:
diff changeset
   772
489c9b5090e2 Initial load
duke
parents:
diff changeset
   773
//------------------------------isA_Copy---------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   774
// Dividing by self is 1.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   775
// If the divisor is 1, we are an identity on the dividend.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   776
Node *DivDNode::Identity( PhaseTransform *phase ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   777
  return (phase->type( in(2) ) == TypeD::ONE) ? in(1) : this;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   778
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   779
489c9b5090e2 Initial load
duke
parents:
diff changeset
   780
//------------------------------Idealize---------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   781
Node *DivDNode::Ideal(PhaseGVN *phase, bool can_reshape) {
  // Strength-reduce a double division by a constant positive power of two
  // into a multiplication by the reciprocal constant.  Returns 'this' when
  // the control input was cleaned up, a new MulDNode when the reduction
  // applies, and NULL when nothing changed.
  if (in(0) && remove_dead_region(phase, can_reshape))  return this;
  // A node hanging off dead control is not worth transforming
  if( in(0) && in(0)->is_top() )  return NULL;

  const Type *divisor_type = phase->type( in(2) );
  // Division by one is an identity and is skipped here
  if( divisor_type == TypeD::ONE ) return NULL;

  // Only a genuine double constant divisor qualifies
  const TypeD *divisor_con = divisor_type->isa_double_constant();
  if( divisor_con == NULL ) return NULL;
  if( divisor_con->base() != Type::DoubleCon ) return NULL;

  // Reject NaN and non-finite divisors
  if( divisor_con->is_nan() || !divisor_con->is_finite() ) return NULL;

  const double divisor = divisor_con->getd();
  int exponent;

  // frexp() produces a mantissa of exactly 0.5 only for a positive power of 2
  if( frexp(divisor, &exponent) != 0.5 ) return NULL;

  // Restrict the exponent so that the reciprocal is again an exactly
  // representable power of 2
  if( exponent < -1021 || exponent > 1022 ) return NULL;

  const double reciprocal = 1.0 / divisor;

  assert( frexp(reciprocal, &exponent) == 0.5, "reciprocal should be power of 2" );

  // x / 2^n ==> x * 2^-n
  Node *reciprocal_con = phase->makecon(TypeD::make(reciprocal));
  return (new (phase->C, 3) MulDNode(in(1), reciprocal_con));
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   815
489c9b5090e2 Initial load
duke
parents:
diff changeset
   816
//=============================================================================
489c9b5090e2 Initial load
duke
parents:
diff changeset
   817
//------------------------------Idealize---------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   818
Node *ModINode::Ideal(PhaseGVN *phase, bool can_reshape) {
  // Idealize an int modulo.  Handled cases, in order:
  //   - drop a control input that only guards against a zero divisor when
  //     the divisor's type already excludes zero;
  //   - constant divisor 2^k-1: unrolled shift/and/add reduction followed by
  //     a conditional-move fixup;
  //   - constant divisor +/-1: constant zero;
  //   - constant power-of-two divisor with non-negative dividend: bit mask;
  //   - any other constant divisor: x - (x / c) * c using the multiply-based
  //     divide transform.
  // Returns 'this' when the node was modified in place, a new node when the
  // modulo was replaced, and NULL when nothing changed.

  // Check for dead control input
  if( in(0) && remove_dead_region(phase, can_reshape) )  return this;
  // Don't bother trying to transform a dead node
  if( in(0) && in(0)->is_top() )  return NULL;

  // Get the modulus
  const Type *t = phase->type( in(2) );
  if( t == Type::TOP ) return NULL;
  const TypeInt *ti = t->is_int();

  // Check for useless control input
  // Check for excluding mod-zero case
  if( in(0) && (ti->_hi < 0 || ti->_lo > 0) ) {
    set_req(0, NULL);        // Yank control input
    return this;
  }

  // See if we are MOD'ing by 2^k or 2^k-1.
  if( !ti->is_con() ) return NULL;
  jint con = ti->get_con();

  // NOTE: the scratch 'hook' node used to keep intermediate values alive is
  // allocated only on the paths that really need it.  Allocating it up front
  // left an orphaned node behind on every early exit below.

  // First, special check for modulo 2^k-1
  if( con >= 0 && con < max_jint && is_power_of_2(con+1) ) {
    uint k = exact_log2(con+1);  // Extract k

    // Basic algorithm by David Detlefs.  See fastmod_int.java for gory details.
    static int unroll_factor[] = { 999, 999, 29, 14, 9, 7, 5, 4, 4, 3, 3, 2, 2, 2, 2, 2, 1 /*past here we assume 1 forever*/};
    int trip_count = 1;
    if( k < ARRAY_SIZE(unroll_factor))  trip_count = unroll_factor[k];

    // If the unroll factor is not too large, and if conditional moves are
    // ok, then use this case
    if( trip_count <= 5 && ConditionalMoveLimit != 0 ) {
      Node *x = in(1);            // Value being mod'd
      Node *divisor = in(2);      // Also is mask

      Node *hook = new (phase->C, 1) Node(1);
      hook->init_req(0, x);       // Add a use to x to prevent him from dying
      // Generate code to reduce X rapidly to nearly 2^k-1.
      for( int i = 0; i < trip_count; i++ ) {
        Node *xl = phase->transform( new (phase->C, 3) AndINode(x,divisor) );
        Node *xh = phase->transform( new (phase->C, 3) RShiftINode(x,phase->intcon(k)) ); // Must be signed
        x = phase->transform( new (phase->C, 3) AddINode(xh,xl) );
        hook->set_req(0, x);      // Keep the newest partial result alive
      }

      // Generate sign-fixup code.  Was original value positive?
      // int hack_res = (in(1) >= 0) ? divisor : 1;
      Node *cmp1 = phase->transform( new (phase->C, 3) CmpINode( in(1), phase->intcon(0) ) );
      Node *bol1 = phase->transform( new (phase->C, 2) BoolNode( cmp1, BoolTest::ge ) );
      Node *cmov1= phase->transform( new (phase->C, 4) CMoveINode(bol1, phase->intcon(1), divisor, TypeInt::POS) );
      // if( x >= hack_res ) x -= divisor;
      Node *sub  = phase->transform( new (phase->C, 3) SubINode( x, divisor ) );
      Node *cmp2 = phase->transform( new (phase->C, 3) CmpINode( x, cmov1 ) );
      Node *bol2 = phase->transform( new (phase->C, 2) BoolNode( cmp2, BoolTest::ge ) );
      // Convention is to not transform the return value of an Ideal
      // since Ideal is expected to return a modified 'this' or a new node.
      Node *cmov2= new (phase->C, 4) CMoveINode(bol2, x, sub, TypeInt::INT);
      // cmov2 is now the mod

      // Now remove the bogus extra edges used to keep things alive
      if (can_reshape) {
        phase->is_IterGVN()->remove_dead_node(hook);
      } else {
        hook->set_req(0, NULL);   // Just yank bogus edge during Parse phase
      }
      return cmov2;
    }
  }

  // Fell thru, the unroll case is not appropriate. Transform the modulo
  // into a long multiply/int multiply/subtract case

  // Cannot handle mod 0, and min_jint isn't handled by the transform
  if( con == 0 || con == min_jint ) return NULL;

  // Get the absolute value of the constant; at this point, we can use this
  jint pos_con = (con >= 0) ? con : -con;

  // integer Mod 1 is always 0
  if( pos_con == 1 ) return new (phase->C, 1) ConINode(TypeInt::ZERO);

  int log2_con = -1;

  // If this is a power of two, then maybe we can mask it
  if( is_power_of_2(pos_con) ) {
    log2_con = log2_intptr((intptr_t)pos_con);

    const Type *dt = phase->type(in(1));
    const TypeInt *dti = dt->isa_int();

    // See if this can be masked, if the dividend is non-negative
    if( dti && dti->_lo >= 0 )
      return ( new (phase->C, 3) AndINode( in(1), phase->intcon( pos_con-1 ) ) );
  }

  // Save in(1) so that it cannot be changed or deleted
  Node *hook = new (phase->C, 1) Node(1);
  hook->init_req(0, in(1));

  // Divide using the transform from DivI to MulL
  Node *result = transform_int_divide( phase, in(1), pos_con );
  if (result != NULL) {
    Node *divide = phase->transform(result);

    // Re-multiply, using a shift if this is a power of two
    Node *mult = NULL;

    if( log2_con >= 0 )
      mult = phase->transform( new (phase->C, 3) LShiftINode( divide, phase->intcon( log2_con ) ) );
    else
      mult = phase->transform( new (phase->C, 3) MulINode( divide, phase->intcon( pos_con ) ) );

    // Finally, subtract the multiplied divided value from the original
    result = new (phase->C, 3) SubINode( in(1), mult );
  }

  // Now remove the bogus extra edges used to keep things alive
  if (can_reshape) {
    phase->is_IterGVN()->remove_dead_node(hook);
  } else {
    hook->set_req(0, NULL);       // Just yank bogus edge during Parse phase
  }

  // return the value
  return result;
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   946
489c9b5090e2 Initial load
duke
parents:
diff changeset
   947
//------------------------------Value------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   948
const Type *ModINode::Value( PhaseTransform *phase ) const {
  // Compute the type of an int modulo from the types of its two inputs.
  const Type *dividend_type = phase->type( in(1) );
  const Type *divisor_type  = phase->type( in(2) );

  // TOP on either input makes the result TOP
  if( dividend_type == Type::TOP ) return Type::TOP;
  if( divisor_type  == Type::TOP ) return Type::TOP;

  // We always generate the dynamic check for 0.
  // 0 MOD X is 0
  if( dividend_type == TypeInt::ZERO ) return TypeInt::ZERO;
  // X MOD X is 0
  if( phase->eqv( in(1), in(2) ) ) return TypeInt::ZERO;

  // BOTTOM (local or global) on either input gives the local BOTTOM
  const Type *bot = bottom_type();
  const bool dividend_is_bottom = (dividend_type == bot) || (dividend_type == Type::BOTTOM);
  const bool divisor_is_bottom  = (divisor_type  == bot) || (divisor_type  == Type::BOTTOM);
  if( dividend_is_bottom || divisor_is_bottom ) {
    return bot;
  }

  const TypeInt *dividend = dividend_type->is_int();
  const TypeInt *divisor  = divisor_type->is_int();

  if( dividend->is_con() && divisor->is_con() ) {
    // Both inputs are int constants: fold the modulo.
    // Mod by zero?  Throw exception at runtime!
    if( !divisor->get_con() ) return TypeInt::POS;

    // min_jint % -1 is defined to be 0; handle it before the native '%'
    if( dividend->get_con() == min_jint && divisor->get_con() == -1 ) {
      return TypeInt::ZERO;
    }

    return TypeInt::make( dividend->get_con() % divisor->get_con() );
  }

  // At least one input is not a constant.  Two non-negative ranges give a
  // non-negative result; otherwise we know little.
  if( dividend->_lo >= 0 && divisor->_lo >= 0 ) {
    return TypeInt::POS;
  }
  return TypeInt::INT;
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   985
489c9b5090e2 Initial load
duke
parents:
diff changeset
   986
489c9b5090e2 Initial load
duke
parents:
diff changeset
   987
//=============================================================================
489c9b5090e2 Initial load
duke
parents:
diff changeset
   988
//------------------------------Idealize---------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   989
Node *ModLNode::Ideal(PhaseGVN *phase, bool can_reshape) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   990
  // Check for dead control input
1067
f82e0a8cd438 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 1056
diff changeset
   991
  if( in(0) && remove_dead_region(phase, can_reshape) )  return this;
f82e0a8cd438 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 1056
diff changeset
   992
  // Don't bother trying to transform a dead node
f82e0a8cd438 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 1056
diff changeset
   993
  if( in(0) && in(0)->is_top() )  return NULL;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   994
489c9b5090e2 Initial load
duke
parents:
diff changeset
   995
  // Get the modulus
489c9b5090e2 Initial load
duke
parents:
diff changeset
   996
  const Type *t = phase->type( in(2) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   997
  if( t == Type::TOP ) return NULL;
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
   998
  const TypeLong *tl = t->is_long();
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   999
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1000
  // Check for useless control input
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1001
  // Check for excluding mod-zero case
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1002
  if( in(0) && (tl->_hi < 0 || tl->_lo > 0) ) {
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1003
    set_req(0, NULL);        // Yank control input
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1004
    return this;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1005
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1006
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1007
  // See if we are MOD'ing by 2^k or 2^k-1.
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1008
  if( !tl->is_con() ) return NULL;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1009
  jlong con = tl->get_con();
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1010
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1011
  Node *hook = new (phase->C, 1) Node(1);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1012
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1013
  // Expand mod
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1014
  if( con >= 0 && con < max_jlong && is_power_of_2_long(con+1) ) {
2032
1e27661bff28 6805724: ModLNode::Ideal() generates functionally incorrect graph when divisor is any (2^k-1) constant.
twisti
parents: 2031
diff changeset
  1015
    uint k = exact_log2_long(con+1);  // Extract k
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1016
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1017
    // Basic algorithm by David Detlefs.  See fastmod_long.java for gory details.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1018
    // Used to help a popular random number generator which does a long-mod
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1019
    // of 2^31-1 and shows up in SpecJBB and SciMark.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1020
    static int unroll_factor[] = { 999, 999, 61, 30, 20, 15, 12, 10, 8, 7, 6, 6, 5, 5, 4, 4, 4, 3, 3, 3, 3, 3, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1 /*past here we assume 1 forever*/};
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1021
    int trip_count = 1;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1022
    if( k < ARRAY_SIZE(unroll_factor)) trip_count = unroll_factor[k];
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1023
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1024
    // If the unroll factor is not too large, and if conditional moves are
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1025
    // ok, then use this case
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1026
    if( trip_count <= 5 && ConditionalMoveLimit != 0 ) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1027
      Node *x = in(1);            // Value being mod'd
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1028
      Node *divisor = in(2);      // Also is mask
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1029
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1030
      hook->init_req(0, x);       // Add a use to x to prevent him from dying
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1031
      // Generate code to reduce X rapidly to nearly 2^k-1.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1032
      for( int i = 0; i < trip_count; i++ ) {
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1033
        Node *xl = phase->transform( new (phase->C, 3) AndLNode(x,divisor) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1034
        Node *xh = phase->transform( new (phase->C, 3) RShiftLNode(x,phase->intcon(k)) ); // Must be signed
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1035
        x = phase->transform( new (phase->C, 3) AddLNode(xh,xl) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1036
        hook->set_req(0, x);    // Add a use to x to prevent him from dying
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1037
      }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1038
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1039
      // Generate sign-fixup code.  Was original value positive?
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1040
      // long hack_res = (i >= 0) ? divisor : CONST64(1);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1041
      Node *cmp1 = phase->transform( new (phase->C, 3) CmpLNode( in(1), phase->longcon(0) ) );
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1042
      Node *bol1 = phase->transform( new (phase->C, 2) BoolNode( cmp1, BoolTest::ge ) );
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1043
      Node *cmov1= phase->transform( new (phase->C, 4) CMoveLNode(bol1, phase->longcon(1), divisor, TypeLong::LONG) );
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1044
      // if( x >= hack_res ) x -= divisor;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1045
      Node *sub  = phase->transform( new (phase->C, 3) SubLNode( x, divisor ) );
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1046
      Node *cmp2 = phase->transform( new (phase->C, 3) CmpLNode( x, cmov1 ) );
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1047
      Node *bol2 = phase->transform( new (phase->C, 2) BoolNode( cmp2, BoolTest::ge ) );
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1048
      // Convention is to not transform the return value of an Ideal
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1049
      // since Ideal is expected to return a modified 'this' or a new node.
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1050
      Node *cmov2= new (phase->C, 4) CMoveLNode(bol2, x, sub, TypeLong::LONG);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1051
      // cmov2 is now the mod
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1052
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1053
      // Now remove the bogus extra edges used to keep things alive
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1054
      if (can_reshape) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1055
        phase->is_IterGVN()->remove_dead_node(hook);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1056
      } else {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1057
        hook->set_req(0, NULL);   // Just yank bogus edge during Parse phase
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1058
      }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1059
      return cmov2;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1060
    }
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1061
  }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1062
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1063
  // Fell thru, the unroll case is not appropriate. Transform the modulo
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1064
  // into a long multiply/int multiply/subtract case
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1065
7115
32300e243300 6987135: Performance regression on Intel platform with 32-bits edition between 6u13 and 6u14.
kvn
parents: 5547
diff changeset
  1066
  // Cannot handle mod 0, and min_jlong isn't handled by the transform
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1067
  if( con == 0 || con == min_jlong ) return NULL;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1068
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1069
  // Get the absolute value of the constant; at this point, we can use this
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1070
  jlong pos_con = (con >= 0) ? con : -con;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1071
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1072
  // integer Mod 1 is always 0
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1073
  if( pos_con == 1 ) return new (phase->C, 1) ConLNode(TypeLong::ZERO);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1074
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1075
  int log2_con = -1;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1076
2131
98f9cef66a34 6810672: Comment typos
twisti
parents: 2032
diff changeset
  1077
  // If this is a power of two, then maybe we can mask it
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1078
  if( is_power_of_2_long(pos_con) ) {
7115
32300e243300 6987135: Performance regression on Intel platform with 32-bits edition between 6u13 and 6u14.
kvn
parents: 5547
diff changeset
  1079
    log2_con = exact_log2_long(pos_con);
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1080
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1081
    const Type *dt = phase->type(in(1));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1082
    const TypeLong *dtl = dt->isa_long();
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1083
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1084
    // See if this can be masked, if the dividend is non-negative
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1085
    if( dtl && dtl->_lo >= 0 )
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1086
      return ( new (phase->C, 3) AndLNode( in(1), phase->longcon( pos_con-1 ) ) );
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1087
  }
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1088
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1089
  // Save in(1) so that it cannot be changed or deleted
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1090
  hook->init_req(0, in(1));
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1091
7115
32300e243300 6987135: Performance regression on Intel platform with 32-bits edition between 6u13 and 6u14.
kvn
parents: 5547
diff changeset
  1092
  // Divide using the transform from DivL to MulL
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1093
  Node *result = transform_long_divide( phase, in(1), pos_con );
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1094
  if (result != NULL) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1095
    Node *divide = phase->transform(result);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1096
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1097
    // Re-multiply, using a shift if this is a power of two
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1098
    Node *mult = NULL;
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1099
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1100
    if( log2_con >= 0 )
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1101
      mult = phase->transform( new (phase->C, 3) LShiftLNode( divide, phase->intcon( log2_con ) ) );
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1102
    else
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1103
      mult = phase->transform( new (phase->C, 3) MulLNode( divide, phase->longcon( pos_con ) ) );
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1104
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1105
    // Finally, subtract the multiplied divided value from the original
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1106
    result = new (phase->C, 3) SubLNode( in(1), mult );
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1107
  }
392
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1108
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1109
  // Now remove the bogus extra edges used to keep things alive
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1110
  if (can_reshape) {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1111
    phase->is_IterGVN()->remove_dead_node(hook);
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1112
  } else {
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1113
    hook->set_req(0, NULL);       // Just yank bogus edge during Parse phase
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1114
  }
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1115
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1116
  // return the value
0b3167e2f2de 6603011: RFE: Optimize long division
rasbold
parents: 378
diff changeset
  1117
  return result;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1118
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1119
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1120
//------------------------------Value------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1121
const Type *ModLNode::Value( PhaseTransform *phase ) const {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1122
  // Either input is TOP ==> the result is TOP
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1123
  const Type *t1 = phase->type( in(1) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1124
  const Type *t2 = phase->type( in(2) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1125
  if( t1 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1126
  if( t2 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1127
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1128
  // We always generate the dynamic check for 0.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1129
  // 0 MOD X is 0
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1130
  if( t1 == TypeLong::ZERO ) return TypeLong::ZERO;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1131
  // X MOD X is 0
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1132
  if( phase->eqv( in(1), in(2) ) ) return TypeLong::ZERO;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1133
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1134
  // Either input is BOTTOM ==> the result is the local BOTTOM
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1135
  const Type *bot = bottom_type();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1136
  if( (t1 == bot) || (t2 == bot) ||
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1137
      (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1138
    return bot;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1139
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1140
  const TypeLong *i1 = t1->is_long();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1141
  const TypeLong *i2 = t2->is_long();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1142
  if( !i1->is_con() || !i2->is_con() ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1143
    if( i1->_lo >= CONST64(0) && i2->_lo >= CONST64(0) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1144
      return TypeLong::POS;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1145
    // If both numbers are not constants, we know little.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1146
    return TypeLong::LONG;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1147
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1148
  // Mod by zero?  Throw exception at runtime!
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1149
  if( !i2->get_con() ) return TypeLong::POS;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1150
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1151
  // We must be modulo'ing 2 float constants.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1152
  // Check for min_jint % '-1', result is defined to be '0'.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1153
  if( i1->get_con() == min_jlong && i2->get_con() == -1 )
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1154
    return TypeLong::ZERO;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1155
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1156
  return TypeLong::make( i1->get_con() % i2->get_con() );
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1157
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1158
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1159
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1160
//=============================================================================
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1161
//------------------------------Value------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1162
const Type *ModFNode::Value( PhaseTransform *phase ) const {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1163
  // Either input is TOP ==> the result is TOP
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1164
  const Type *t1 = phase->type( in(1) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1165
  const Type *t2 = phase->type( in(2) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1166
  if( t1 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1167
  if( t2 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1168
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1169
  // Either input is BOTTOM ==> the result is the local BOTTOM
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1170
  const Type *bot = bottom_type();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1171
  if( (t1 == bot) || (t2 == bot) ||
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1172
      (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1173
    return bot;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1174
378
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1175
  // If either number is not a constant, we know nothing.
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1176
  if ((t1->base() != Type::FloatCon) || (t2->base() != Type::FloatCon)) {
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1177
    return Type::FLOAT;         // note: x%x can be either NaN or 0
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1178
  }
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1179
378
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1180
  float f1 = t1->getf();
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1181
  float f2 = t2->getf();
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1182
  jint  x1 = jint_cast(f1);     // note:  *(int*)&f1, not just (int)f1
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1183
  jint  x2 = jint_cast(f2);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1184
378
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1185
  // If either is a NaN, return an input NaN
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1186
  if (g_isnan(f1))    return t1;
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1187
  if (g_isnan(f2))    return t2;
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1188
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1189
  // If an operand is infinity or the divisor is +/- zero, punt.
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1190
  if (!g_isfinite(f1) || !g_isfinite(f2) || x2 == 0 || x2 == min_jint)
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1191
    return Type::FLOAT;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1192
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1193
  // We must be modulo'ing 2 float constants.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1194
  // Make sure that the sign of the fmod is equal to the sign of the dividend
378
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1195
  jint xr = jint_cast(fmod(f1, f2));
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1196
  if ((x1 ^ xr) < 0) {
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1197
    xr ^= min_jint;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1198
  }
378
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1199
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1200
  return TypeF::make(jfloat_cast(xr));
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1201
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1202
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1203
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1204
//=============================================================================
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1205
//------------------------------Value------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1206
const Type *ModDNode::Value( PhaseTransform *phase ) const {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1207
  // Either input is TOP ==> the result is TOP
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1208
  const Type *t1 = phase->type( in(1) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1209
  const Type *t2 = phase->type( in(2) );
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1210
  if( t1 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1211
  if( t2 == Type::TOP ) return Type::TOP;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1212
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1213
  // Either input is BOTTOM ==> the result is the local BOTTOM
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1214
  const Type *bot = bottom_type();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1215
  if( (t1 == bot) || (t2 == bot) ||
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1216
      (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1217
    return bot;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1218
378
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1219
  // If either number is not a constant, we know nothing.
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1220
  if ((t1->base() != Type::DoubleCon) || (t2->base() != Type::DoubleCon)) {
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1221
    return Type::DOUBLE;        // note: x%x can be either NaN or 0
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1222
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1223
378
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1224
  double f1 = t1->getd();
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1225
  double f2 = t2->getd();
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1226
  jlong  x1 = jlong_cast(f1);   // note:  *(long*)&f1, not just (long)f1
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1227
  jlong  x2 = jlong_cast(f2);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1228
378
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1229
  // If either is a NaN, return an input NaN
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1230
  if (g_isnan(f1))    return t1;
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1231
  if (g_isnan(f2))    return t2;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1232
378
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1233
  // If an operand is infinity or the divisor is +/- zero, punt.
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1234
  if (!g_isfinite(f1) || !g_isfinite(f2) || x2 == 0 || x2 == min_jlong)
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1235
    return Type::DOUBLE;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1236
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1237
  // We must be modulo'ing 2 double constants.
378
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1238
  // Make sure that the sign of the fmod is equal to the sign of the dividend
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1239
  jlong xr = jlong_cast(fmod(f1, f2));
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1240
  if ((x1 ^ xr) < 0) {
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1241
    xr ^= min_jlong;
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1242
  }
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1243
39fb2dc78042 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 1
diff changeset
  1244
  return TypeD::make(jdouble_cast(xr));
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1245
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1246
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1247
//=============================================================================
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1248
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1249
// Build a three-input MultiNode: slot 0 holds the control input 'c', slot 1
// the dividend and slot 2 the divisor.
DivModNode::DivModNode( Node *c, Node *dividend, Node *divisor ) : MultiNode(3) {
  Node* const inputs[] = { c, dividend, divisor };
  for (uint slot = 0; slot < 3; slot++) {
    init_req(slot, inputs[slot]);
  }
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1254
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1255
//------------------------------make------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1256
DivModINode* DivModINode::make(Compile* C, Node* div_or_mod) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1257
  Node* n = div_or_mod;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1258
  assert(n->Opcode() == Op_DivI || n->Opcode() == Op_ModI,
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1259
         "only div or mod input pattern accepted");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1260
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1261
  DivModINode* divmod = new (C, 3) DivModINode(n->in(0), n->in(1), n->in(2));
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1262
  Node*        dproj  = new (C, 1) ProjNode(divmod, DivModNode::div_proj_num);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1263
  Node*        mproj  = new (C, 1) ProjNode(divmod, DivModNode::mod_proj_num);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1264
  return divmod;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1265
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1266
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1267
//------------------------------make------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1268
DivModLNode* DivModLNode::make(Compile* C, Node* div_or_mod) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1269
  Node* n = div_or_mod;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1270
  assert(n->Opcode() == Op_DivL || n->Opcode() == Op_ModL,
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1271
         "only div or mod input pattern accepted");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1272
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1273
  DivModLNode* divmod = new (C, 3) DivModLNode(n->in(0), n->in(1), n->in(2));
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1274
  Node*        dproj  = new (C, 1) ProjNode(divmod, DivModNode::div_proj_num);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1275
  Node*        mproj  = new (C, 1) ProjNode(divmod, DivModNode::mod_proj_num);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1276
  return divmod;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1277
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1278
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1279
//------------------------------match------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1280
// return result(s) along with their RegMask info
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1281
Node *DivModINode::match( const ProjNode *proj, const Matcher *match ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1282
  uint ideal_reg = proj->ideal_reg();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1283
  RegMask rm;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1284
  if (proj->_con == div_proj_num) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1285
    rm = match->divI_proj_mask();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1286
  } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1287
    assert(proj->_con == mod_proj_num, "must be div or mod projection");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1288
    rm = match->modI_proj_mask();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1289
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1290
  return new (match->C, 1)MachProjNode(this, proj->_con, rm, ideal_reg);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1291
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1292
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1293
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1294
//------------------------------match------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1295
// return result(s) along with their RegMask info
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1296
Node *DivModLNode::match( const ProjNode *proj, const Matcher *match ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1297
  uint ideal_reg = proj->ideal_reg();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1298
  RegMask rm;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1299
  if (proj->_con == div_proj_num) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1300
    rm = match->divL_proj_mask();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1301
  } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1302
    assert(proj->_con == mod_proj_num, "must be div or mod projection");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1303
    rm = match->modL_proj_mask();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1304
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1305
  return new (match->C, 1)MachProjNode(this, proj->_con, rm, ideal_reg);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1306
}