hotspot/src/share/vm/opto/gcm.cpp
author coleenp
Mon, 14 Jan 2013 11:01:39 -0500
changeset 15194 a35093d73168
parent 14623 70c4c1be0a14
child 15871 b04dd94da4e6
permissions -rw-r--r--
8006005: Fix constant pool index validation and alignment trap for method parameter reflection Summary: This patch addresses an alignment trap due to the storage format of method parameters data in constMethod. It also adds code to validate constant pool indexes for method parameters data. Reviewed-by: jrose, dholmes Contributed-by: eric.mccorkle@oracle.com
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
     1
/*
13963
e5b53c306fb5 7197424: update copyright year to match last edit in jdk8 hotspot repository
mikael
parents: 11567
diff changeset
     2
 * Copyright (c) 1997, 2012, Oracle and/or its affiliates. All rights reserved.
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
489c9b5090e2 Initial load
duke
parents:
diff changeset
     4
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
489c9b5090e2 Initial load
duke
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
489c9b5090e2 Initial load
duke
parents:
diff changeset
     7
 * published by the Free Software Foundation.
489c9b5090e2 Initial load
duke
parents:
diff changeset
     8
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
     9
 * This code is distributed in the hope that it will be useful, but WITHOUT
489c9b5090e2 Initial load
duke
parents:
diff changeset
    10
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
489c9b5090e2 Initial load
duke
parents:
diff changeset
    11
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
489c9b5090e2 Initial load
duke
parents:
diff changeset
    12
 * version 2 for more details (a copy is included in the LICENSE file that
489c9b5090e2 Initial load
duke
parents:
diff changeset
    13
 * accompanied this code).
489c9b5090e2 Initial load
duke
parents:
diff changeset
    14
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
    15
 * You should have received a copy of the GNU General Public License version
489c9b5090e2 Initial load
duke
parents:
diff changeset
    16
 * 2 along with this work; if not, write to the Free Software Foundation,
489c9b5090e2 Initial load
duke
parents:
diff changeset
    17
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
489c9b5090e2 Initial load
duke
parents:
diff changeset
    18
 *
5547
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 3186
diff changeset
    19
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 3186
diff changeset
    20
 * or visit www.oracle.com if you need additional information or have any
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 3186
diff changeset
    21
 * questions.
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    22
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
    23
 */
489c9b5090e2 Initial load
duke
parents:
diff changeset
    24
7397
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    25
#include "precompiled.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    26
#include "libadt/vectset.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    27
#include "memory/allocation.inline.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    28
#include "opto/block.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    29
#include "opto/c2compiler.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    30
#include "opto/callnode.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    31
#include "opto/cfgnode.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    32
#include "opto/machnode.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    33
#include "opto/opcodes.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    34
#include "opto/phaseX.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    35
#include "opto/rootnode.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    36
#include "opto/runtime.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    37
#include "runtime/deoptimization.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    38
#ifdef TARGET_ARCH_MODEL_x86_32
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    39
# include "adfiles/ad_x86_32.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    40
#endif
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    41
#ifdef TARGET_ARCH_MODEL_x86_64
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    42
# include "adfiles/ad_x86_64.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    43
#endif
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    44
#ifdef TARGET_ARCH_MODEL_sparc
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    45
# include "adfiles/ad_sparc.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    46
#endif
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    47
#ifdef TARGET_ARCH_MODEL_zero
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    48
# include "adfiles/ad_zero.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    49
#endif
8107
78e5bd944384 7016023: Enable building ARM and PPC from src/closed repository
bobv
parents: 7433
diff changeset
    50
#ifdef TARGET_ARCH_MODEL_arm
78e5bd944384 7016023: Enable building ARM and PPC from src/closed repository
bobv
parents: 7433
diff changeset
    51
# include "adfiles/ad_arm.hpp"
78e5bd944384 7016023: Enable building ARM and PPC from src/closed repository
bobv
parents: 7433
diff changeset
    52
#endif
78e5bd944384 7016023: Enable building ARM and PPC from src/closed repository
bobv
parents: 7433
diff changeset
    53
#ifdef TARGET_ARCH_MODEL_ppc
78e5bd944384 7016023: Enable building ARM and PPC from src/closed repository
bobv
parents: 7433
diff changeset
    54
# include "adfiles/ad_ppc.hpp"
78e5bd944384 7016023: Enable building ARM and PPC from src/closed repository
bobv
parents: 7433
diff changeset
    55
#endif
7397
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6180
diff changeset
    56
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    57
// Portions of code courtesy of Clifford Click
489c9b5090e2 Initial load
duke
parents:
diff changeset
    58
489c9b5090e2 Initial load
duke
parents:
diff changeset
    59
// Optimization - Graph Style
489c9b5090e2 Initial load
duke
parents:
diff changeset
    60
2016
c1f73fa547fe 6784930: server jvm fails with assert(!n->is_SpillCopy(),"")
kvn
parents: 1498
diff changeset
    61
// To avoid float value underflow
c1f73fa547fe 6784930: server jvm fails with assert(!n->is_SpillCopy(),"")
kvn
parents: 1498
diff changeset
    62
#define MIN_BLOCK_FREQUENCY 1.e-35f
c1f73fa547fe 6784930: server jvm fails with assert(!n->is_SpillCopy(),"")
kvn
parents: 1498
diff changeset
    63
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    64
//----------------------------schedule_node_into_block-------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
    65
// Insert node n into block b. Look for projections of n and make sure they
489c9b5090e2 Initial load
duke
parents:
diff changeset
    66
// are in b also.
489c9b5090e2 Initial load
duke
parents:
diff changeset
    67
void PhaseCFG::schedule_node_into_block( Node *n, Block *b ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
    68
  // Set basic block of n, Add n to b,
489c9b5090e2 Initial load
duke
parents:
diff changeset
    69
  _bbs.map(n->_idx, b);
489c9b5090e2 Initial load
duke
parents:
diff changeset
    70
  b->add_inst(n);
489c9b5090e2 Initial load
duke
parents:
diff changeset
    71
489c9b5090e2 Initial load
duke
parents:
diff changeset
    72
  // After Matching, nearly any old Node may have projections trailing it.
489c9b5090e2 Initial load
duke
parents:
diff changeset
    73
  // These are usually machine-dependent flags.  In any case, they might
489c9b5090e2 Initial load
duke
parents:
diff changeset
    74
  // float to another block below this one.  Move them up.
489c9b5090e2 Initial load
duke
parents:
diff changeset
    75
  for (DUIterator_Fast imax, i = n->fast_outs(imax); i < imax; i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
    76
    Node*  use  = n->fast_out(i);
489c9b5090e2 Initial load
duke
parents:
diff changeset
    77
    if (use->is_Proj()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
    78
      Block* buse = _bbs[use->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
    79
      if (buse != b) {              // In wrong block?
489c9b5090e2 Initial load
duke
parents:
diff changeset
    80
        if (buse != NULL)
489c9b5090e2 Initial load
duke
parents:
diff changeset
    81
          buse->find_remove(use);   // Remove from wrong block
489c9b5090e2 Initial load
duke
parents:
diff changeset
    82
        _bbs.map(use->_idx, b);     // Re-insert in this block
489c9b5090e2 Initial load
duke
parents:
diff changeset
    83
        b->add_inst(use);
489c9b5090e2 Initial load
duke
parents:
diff changeset
    84
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
    85
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
    86
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
    87
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
    88
2127
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
    89
//----------------------------replace_block_proj_ctrl-------------------------
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
    90
// Nodes that have is_block_proj() nodes as their control need to use
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
    91
// the appropriate Region for their actual block as their control since
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
    92
// the projection will be in a predecessor block.
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
    93
void PhaseCFG::replace_block_proj_ctrl( Node *n ) {
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
    94
  const Node *in0 = n->in(0);
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
    95
  assert(in0 != NULL, "Only control-dependent");
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
    96
  const Node *p = in0->is_block_proj();
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
    97
  if (p != NULL && p != n) {    // Control from a block projection?
11191
d54ab5dcba83 6890673: Eliminate allocations immediately after EA
kvn
parents: 10255
diff changeset
    98
    assert(!n->pinned() || n->is_MachConstantBase(), "only pinned MachConstantBase node is expected here");
2127
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
    99
    // Find trailing Region
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   100
    Block *pb = _bbs[in0->_idx]; // Block-projection already has basic block
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   101
    uint j = 0;
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   102
    if (pb->_num_succs != 1) {  // More then 1 successor?
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   103
      // Search for successor
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   104
      uint max = pb->_nodes.size();
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   105
      assert( max > 1, "" );
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   106
      uint start = max - pb->_num_succs;
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   107
      // Find which output path belongs to projection
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   108
      for (j = start; j < max; j++) {
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   109
        if( pb->_nodes[j] == in0 )
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   110
          break;
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   111
      }
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   112
      assert( j < max, "must find" );
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   113
      // Change control to match head of successor basic block
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   114
      j -= start;
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   115
    }
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   116
    n->set_req(0, pb->_succs[j]->head());
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   117
  }
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   118
}
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   119
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   120
489c9b5090e2 Initial load
duke
parents:
diff changeset
   121
//------------------------------schedule_pinned_nodes--------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   122
// Set the basic block for Nodes pinned into blocks
489c9b5090e2 Initial load
duke
parents:
diff changeset
   123
void PhaseCFG::schedule_pinned_nodes( VectorSet &visited ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   124
  // Allocate node stack of size C->unique()+8 to avoid frequent realloc
489c9b5090e2 Initial load
duke
parents:
diff changeset
   125
  GrowableArray <Node *> spstack(C->unique()+8);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   126
  spstack.push(_root);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   127
  while ( spstack.is_nonempty() ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   128
    Node *n = spstack.pop();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   129
    if( !visited.test_set(n->_idx) ) { // Test node and flag it as visited
489c9b5090e2 Initial load
duke
parents:
diff changeset
   130
      if( n->pinned() && !_bbs.lookup(n->_idx) ) {  // Pinned?  Nail it down!
2127
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   131
        assert( n->in(0), "pinned Node must have Control" );
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   132
        // Before setting block replace block_proj control edge
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   133
        replace_block_proj_ctrl(n);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   134
        Node *input = n->in(0);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   135
        while( !input->is_block_start() )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   136
          input = input->in(0);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   137
        Block *b = _bbs[input->_idx];  // Basic block of controlling input
489c9b5090e2 Initial load
duke
parents:
diff changeset
   138
        schedule_node_into_block(n, b);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   139
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   140
      for( int i = n->req() - 1; i >= 0; --i ) {  // For all inputs
489c9b5090e2 Initial load
duke
parents:
diff changeset
   141
        if( n->in(i) != NULL )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   142
          spstack.push(n->in(i));
489c9b5090e2 Initial load
duke
parents:
diff changeset
   143
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   144
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   145
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   146
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   147
489c9b5090e2 Initial load
duke
parents:
diff changeset
   148
#ifdef ASSERT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   149
// Assert that new input b2 is dominated by all previous inputs.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   150
// Check this by by seeing that it is dominated by b1, the deepest
489c9b5090e2 Initial load
duke
parents:
diff changeset
   151
// input observed until b2.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   152
static void assert_dom(Block* b1, Block* b2, Node* n, Block_Array &bbs) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   153
  if (b1 == NULL)  return;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   154
  assert(b1->_dom_depth < b2->_dom_depth, "sanity");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   155
  Block* tmp = b2;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   156
  while (tmp != b1 && tmp != NULL) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   157
    tmp = tmp->_idom;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   158
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   159
  if (tmp != b1) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   160
    // Detected an unschedulable graph.  Print some nice stuff and die.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   161
    tty->print_cr("!!! Unschedulable graph !!!");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   162
    for (uint j=0; j<n->len(); j++) { // For all inputs
489c9b5090e2 Initial load
duke
parents:
diff changeset
   163
      Node* inn = n->in(j); // Get input
489c9b5090e2 Initial load
duke
parents:
diff changeset
   164
      if (inn == NULL)  continue;  // Ignore NULL, missing inputs
489c9b5090e2 Initial load
duke
parents:
diff changeset
   165
      Block* inb = bbs[inn->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   166
      tty->print("B%d idom=B%d depth=%2d ",inb->_pre_order,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   167
                 inb->_idom ? inb->_idom->_pre_order : 0, inb->_dom_depth);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   168
      inn->dump();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   169
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   170
    tty->print("Failing node: ");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   171
    n->dump();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   172
    assert(false, "unscheduable graph");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   173
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   174
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   175
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
   176
489c9b5090e2 Initial load
duke
parents:
diff changeset
   177
static Block* find_deepest_input(Node* n, Block_Array &bbs) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   178
  // Find the last input dominated by all other inputs.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   179
  Block* deepb           = NULL;        // Deepest block so far
489c9b5090e2 Initial load
duke
parents:
diff changeset
   180
  int    deepb_dom_depth = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   181
  for (uint k = 0; k < n->len(); k++) { // For all inputs
489c9b5090e2 Initial load
duke
parents:
diff changeset
   182
    Node* inn = n->in(k);               // Get input
489c9b5090e2 Initial load
duke
parents:
diff changeset
   183
    if (inn == NULL)  continue;         // Ignore NULL, missing inputs
489c9b5090e2 Initial load
duke
parents:
diff changeset
   184
    Block* inb = bbs[inn->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   185
    assert(inb != NULL, "must already have scheduled this input");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   186
    if (deepb_dom_depth < (int) inb->_dom_depth) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   187
      // The new inb must be dominated by the previous deepb.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   188
      // The various inputs must be linearly ordered in the dom
489c9b5090e2 Initial load
duke
parents:
diff changeset
   189
      // tree, or else there will not be a unique deepest block.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   190
      DEBUG_ONLY(assert_dom(deepb, inb, n, bbs));
489c9b5090e2 Initial load
duke
parents:
diff changeset
   191
      deepb = inb;                      // Save deepest block
489c9b5090e2 Initial load
duke
parents:
diff changeset
   192
      deepb_dom_depth = deepb->_dom_depth;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   193
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   194
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   195
  assert(deepb != NULL, "must be at least one input to n");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   196
  return deepb;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   197
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   198
489c9b5090e2 Initial load
duke
parents:
diff changeset
   199
489c9b5090e2 Initial load
duke
parents:
diff changeset
   200
//------------------------------schedule_early---------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   201
// Find the earliest Block any instruction can be placed in.  Some instructions
489c9b5090e2 Initial load
duke
parents:
diff changeset
   202
// are pinned into Blocks.  Unpinned instructions can appear in last block in
489c9b5090e2 Initial load
duke
parents:
diff changeset
   203
// which all their inputs occur.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   204
bool PhaseCFG::schedule_early(VectorSet &visited, Node_List &roots) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   205
  // Allocate stack with enough space to avoid frequent realloc
489c9b5090e2 Initial load
duke
parents:
diff changeset
   206
  Node_Stack nstack(roots.Size() + 8); // (unique >> 1) + 24 from Java2D stats
489c9b5090e2 Initial load
duke
parents:
diff changeset
   207
  // roots.push(_root); _root will be processed among C->top() inputs
489c9b5090e2 Initial load
duke
parents:
diff changeset
   208
  roots.push(C->top());
489c9b5090e2 Initial load
duke
parents:
diff changeset
   209
  visited.set(C->top()->_idx);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   210
489c9b5090e2 Initial load
duke
parents:
diff changeset
   211
  while (roots.size() != 0) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   212
    // Use local variables nstack_top_n & nstack_top_i to cache values
489c9b5090e2 Initial load
duke
parents:
diff changeset
   213
    // on stack's top.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   214
    Node *nstack_top_n = roots.pop();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   215
    uint  nstack_top_i = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   216
//while_nstack_nonempty:
489c9b5090e2 Initial load
duke
parents:
diff changeset
   217
    while (true) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   218
      // Get parent node and next input's index from stack's top.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   219
      Node *n = nstack_top_n;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   220
      uint  i = nstack_top_i;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   221
489c9b5090e2 Initial load
duke
parents:
diff changeset
   222
      if (i == 0) {
2127
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   223
        // Fixup some control.  Constants without control get attached
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   224
        // to root and nodes that use is_block_proj() nodes should be attached
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   225
        // to the region that starts their block.
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   226
        const Node *in0 = n->in(0);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   227
        if (in0 != NULL) {              // Control-dependent?
2127
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   228
          replace_block_proj_ctrl(n);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   229
        } else {               // n->in(0) == NULL
489c9b5090e2 Initial load
duke
parents:
diff changeset
   230
          if (n->req() == 1) { // This guy is a constant with NO inputs?
489c9b5090e2 Initial load
duke
parents:
diff changeset
   231
            n->set_req(0, _root);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   232
          }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   233
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   234
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   235
489c9b5090e2 Initial load
duke
parents:
diff changeset
   236
      // First, visit all inputs and force them to get a block.  If an
489c9b5090e2 Initial load
duke
parents:
diff changeset
   237
      // input is already in a block we quit following inputs (to avoid
489c9b5090e2 Initial load
duke
parents:
diff changeset
   238
      // cycles). Instead we put that Node on a worklist to be handled
489c9b5090e2 Initial load
duke
parents:
diff changeset
   239
      // later (since IT'S inputs may not have a block yet).
489c9b5090e2 Initial load
duke
parents:
diff changeset
   240
      bool done = true;              // Assume all n's inputs will be processed
489c9b5090e2 Initial load
duke
parents:
diff changeset
   241
      while (i < n->len()) {         // For all inputs
489c9b5090e2 Initial load
duke
parents:
diff changeset
   242
        Node *in = n->in(i);         // Get input
489c9b5090e2 Initial load
duke
parents:
diff changeset
   243
        ++i;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   244
        if (in == NULL) continue;    // Ignore NULL, missing inputs
489c9b5090e2 Initial load
duke
parents:
diff changeset
   245
        int is_visited = visited.test_set(in->_idx);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   246
        if (!_bbs.lookup(in->_idx)) { // Missing block selection?
489c9b5090e2 Initial load
duke
parents:
diff changeset
   247
          if (is_visited) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   248
            // assert( !visited.test(in->_idx), "did not schedule early" );
489c9b5090e2 Initial load
duke
parents:
diff changeset
   249
            return false;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   250
          }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   251
          nstack.push(n, i);         // Save parent node and next input's index.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   252
          nstack_top_n = in;         // Process current input now.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   253
          nstack_top_i = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   254
          done = false;              // Not all n's inputs processed.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   255
          break; // continue while_nstack_nonempty;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   256
        } else if (!is_visited) {    // Input not yet visited?
489c9b5090e2 Initial load
duke
parents:
diff changeset
   257
          roots.push(in);            // Visit this guy later, using worklist
489c9b5090e2 Initial load
duke
parents:
diff changeset
   258
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   259
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   260
      if (done) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   261
        // All of n's inputs have been processed, complete post-processing.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   262
489c9b5090e2 Initial load
duke
parents:
diff changeset
   263
        // Some instructions are pinned into a block.  These include Region,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   264
        // Phi, Start, Return, and other control-dependent instructions and
489c9b5090e2 Initial load
duke
parents:
diff changeset
   265
        // any projections which depend on them.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   266
        if (!n->pinned()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   267
          // Set earliest legal block.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   268
          _bbs.map(n->_idx, find_deepest_input(n, _bbs));
2127
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   269
        } else {
268ea58ed775 6809798: SafePointScalarObject node placed into incorrect block during GCM
kvn
parents: 2016
diff changeset
   270
          assert(_bbs[n->_idx] == _bbs[n->in(0)->_idx], "Pinned Node should be at the same block as its control edge");
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   271
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   272
489c9b5090e2 Initial load
duke
parents:
diff changeset
   273
        if (nstack.is_empty()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   274
          // Finished all nodes on stack.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   275
          // Process next node on the worklist 'roots'.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   276
          break;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   277
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   278
        // Get saved parent node and next input's index.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   279
        nstack_top_n = nstack.node();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   280
        nstack_top_i = nstack.index();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   281
        nstack.pop();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   282
      } //    if (done)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   283
    }   // while (true)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   284
  }     // while (roots.size() != 0)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   285
  return true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   286
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   287
489c9b5090e2 Initial load
duke
parents:
diff changeset
   288
//------------------------------dom_lca----------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   289
// Find least common ancestor in dominator tree
489c9b5090e2 Initial load
duke
parents:
diff changeset
   290
// LCA is a current notion of LCA, to be raised above 'this'.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   291
// As a convenient boundary condition, return 'this' if LCA is NULL.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   292
// Find the LCA of those two nodes.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   293
Block* Block::dom_lca(Block* LCA) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   294
  if (LCA == NULL || LCA == this)  return this;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   295
489c9b5090e2 Initial load
duke
parents:
diff changeset
   296
  Block* anc = this;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   297
  while (anc->_dom_depth > LCA->_dom_depth)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   298
    anc = anc->_idom;           // Walk up till anc is as high as LCA
489c9b5090e2 Initial load
duke
parents:
diff changeset
   299
489c9b5090e2 Initial load
duke
parents:
diff changeset
   300
  while (LCA->_dom_depth > anc->_dom_depth)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   301
    LCA = LCA->_idom;           // Walk up till LCA is as high as anc
489c9b5090e2 Initial load
duke
parents:
diff changeset
   302
489c9b5090e2 Initial load
duke
parents:
diff changeset
   303
  while (LCA != anc) {          // Walk both up till they are the same
489c9b5090e2 Initial load
duke
parents:
diff changeset
   304
    LCA = LCA->_idom;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   305
    anc = anc->_idom;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   306
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   307
489c9b5090e2 Initial load
duke
parents:
diff changeset
   308
  return LCA;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   309
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   310
489c9b5090e2 Initial load
duke
parents:
diff changeset
   311
//--------------------------raise_LCA_above_use--------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   312
// We are placing a definition, and have been given a def->use edge.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   313
// The definition must dominate the use, so move the LCA upward in the
489c9b5090e2 Initial load
duke
parents:
diff changeset
   314
// dominator tree to dominate the use.  If the use is a phi, adjust
489c9b5090e2 Initial load
duke
parents:
diff changeset
   315
// the LCA only with the phi input paths which actually use this def.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   316
static Block* raise_LCA_above_use(Block* LCA, Node* use, Node* def, Block_Array &bbs) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   317
  Block* buse = bbs[use->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   318
  if (buse == NULL)    return LCA;   // Unused killing Projs have no use block
489c9b5090e2 Initial load
duke
parents:
diff changeset
   319
  if (!use->is_Phi())  return buse->dom_lca(LCA);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   320
  uint pmax = use->req();       // Number of Phi inputs
489c9b5090e2 Initial load
duke
parents:
diff changeset
   321
  // Why does not this loop just break after finding the matching input to
489c9b5090e2 Initial load
duke
parents:
diff changeset
   322
  // the Phi?  Well...it's like this.  I do not have true def-use/use-def
489c9b5090e2 Initial load
duke
parents:
diff changeset
   323
  // chains.  Means I cannot distinguish, from the def-use direction, which
489c9b5090e2 Initial load
duke
parents:
diff changeset
   324
  // of many use-defs lead from the same use to the same def.  That is, this
489c9b5090e2 Initial load
duke
parents:
diff changeset
   325
  // Phi might have several uses of the same def.  Each use appears in a
489c9b5090e2 Initial load
duke
parents:
diff changeset
   326
  // different predecessor block.  But when I enter here, I cannot distinguish
489c9b5090e2 Initial load
duke
parents:
diff changeset
   327
  // which use-def edge I should find the predecessor block for.  So I find
489c9b5090e2 Initial load
duke
parents:
diff changeset
   328
  // them all.  Means I do a little extra work if a Phi uses the same value
489c9b5090e2 Initial load
duke
parents:
diff changeset
   329
  // more than once.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   330
  for (uint j=1; j<pmax; j++) { // For all inputs
489c9b5090e2 Initial load
duke
parents:
diff changeset
   331
    if (use->in(j) == def) {    // Found matching input?
489c9b5090e2 Initial load
duke
parents:
diff changeset
   332
      Block* pred = bbs[buse->pred(j)->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   333
      LCA = pred->dom_lca(LCA);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   334
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   335
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   336
  return LCA;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   337
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   338
489c9b5090e2 Initial load
duke
parents:
diff changeset
   339
//----------------------------raise_LCA_above_marks----------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   340
// Return a new LCA that dominates LCA and any of its marked predecessors.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   341
// Search all my parents up to 'early' (exclusive), looking for predecessors
489c9b5090e2 Initial load
duke
parents:
diff changeset
   342
// which are marked with the given index.  Return the LCA (in the dom tree)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   343
// of all marked blocks.  If there are none marked, return the original
489c9b5090e2 Initial load
duke
parents:
diff changeset
   344
// LCA.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   345
static Block* raise_LCA_above_marks(Block* LCA, node_idx_t mark,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   346
                                    Block* early, Block_Array &bbs) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   347
  Block_List worklist;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   348
  worklist.push(LCA);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   349
  while (worklist.size() > 0) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   350
    Block* mid = worklist.pop();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   351
    if (mid == early)  continue;  // stop searching here
489c9b5090e2 Initial load
duke
parents:
diff changeset
   352
489c9b5090e2 Initial load
duke
parents:
diff changeset
   353
    // Test and set the visited bit.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   354
    if (mid->raise_LCA_visited() == mark)  continue;  // already visited
489c9b5090e2 Initial load
duke
parents:
diff changeset
   355
489c9b5090e2 Initial load
duke
parents:
diff changeset
   356
    // Don't process the current LCA, otherwise the search may terminate early
489c9b5090e2 Initial load
duke
parents:
diff changeset
   357
    if (mid != LCA && mid->raise_LCA_mark() == mark) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   358
      // Raise the LCA.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   359
      LCA = mid->dom_lca(LCA);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   360
      if (LCA == early)  break;   // stop searching everywhere
489c9b5090e2 Initial load
duke
parents:
diff changeset
   361
      assert(early->dominates(LCA), "early is high enough");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   362
      // Resume searching at that point, skipping intermediate levels.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   363
      worklist.push(LCA);
761
312de898447e 6714694: assertion in 64bit server vm (store->find_edge(load) != -1,"missing precedence edge") with COOPs
kvn
parents: 204
diff changeset
   364
      if (LCA == mid)
312de898447e 6714694: assertion in 64bit server vm (store->find_edge(load) != -1,"missing precedence edge") with COOPs
kvn
parents: 204
diff changeset
   365
        continue; // Don't mark as visited to avoid early termination.
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   366
    } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   367
      // Keep searching through this block's predecessors.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   368
      for (uint j = 1, jmax = mid->num_preds(); j < jmax; j++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   369
        Block* mid_parent = bbs[ mid->pred(j)->_idx ];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   370
        worklist.push(mid_parent);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   371
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   372
    }
761
312de898447e 6714694: assertion in 64bit server vm (store->find_edge(load) != -1,"missing precedence edge") with COOPs
kvn
parents: 204
diff changeset
   373
    mid->set_raise_LCA_visited(mark);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   374
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   375
  return LCA;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   376
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   377
489c9b5090e2 Initial load
duke
parents:
diff changeset
   378
//--------------------------memory_early_block--------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   379
// This is a variation of find_deepest_input, the heart of schedule_early.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   380
// Find the "early" block for a load, if we considered only memory and
489c9b5090e2 Initial load
duke
parents:
diff changeset
   381
// address inputs, that is, if other data inputs were ignored.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   382
//
489c9b5090e2 Initial load
duke
parents:
diff changeset
   383
// Because a subset of edges are considered, the resulting block will
489c9b5090e2 Initial load
duke
parents:
diff changeset
   384
// be earlier (at a shallower dom_depth) than the true schedule_early
489c9b5090e2 Initial load
duke
parents:
diff changeset
   385
// point of the node. We compute this earlier block as a more permissive
489c9b5090e2 Initial load
duke
parents:
diff changeset
   386
// site for anti-dependency insertion, but only if subsume_loads is enabled.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   387
static Block* memory_early_block(Node* load, Block* early, Block_Array &bbs) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   388
  Node* base;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   389
  Node* index;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   390
  Node* store = load->in(MemNode::Memory);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   391
  load->as_Mach()->memory_inputs(base, index);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   392
489c9b5090e2 Initial load
duke
parents:
diff changeset
   393
  assert(base != NodeSentinel && index != NodeSentinel,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   394
         "unexpected base/index inputs");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   395
489c9b5090e2 Initial load
duke
parents:
diff changeset
   396
  Node* mem_inputs[4];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   397
  int mem_inputs_length = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   398
  if (base != NULL)  mem_inputs[mem_inputs_length++] = base;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   399
  if (index != NULL) mem_inputs[mem_inputs_length++] = index;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   400
  if (store != NULL) mem_inputs[mem_inputs_length++] = store;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   401
489c9b5090e2 Initial load
duke
parents:
diff changeset
   402
  // In the comparision below, add one to account for the control input,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   403
  // which may be null, but always takes up a spot in the in array.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   404
  if (mem_inputs_length + 1 < (int) load->req()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   405
    // This "load" has more inputs than just the memory, base and index inputs.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   406
    // For purposes of checking anti-dependences, we need to start
489c9b5090e2 Initial load
duke
parents:
diff changeset
   407
    // from the early block of only the address portion of the instruction,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   408
    // and ignore other blocks that may have factored into the wider
489c9b5090e2 Initial load
duke
parents:
diff changeset
   409
    // schedule_early calculation.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   410
    if (load->in(0) != NULL) mem_inputs[mem_inputs_length++] = load->in(0);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   411
489c9b5090e2 Initial load
duke
parents:
diff changeset
   412
    Block* deepb           = NULL;        // Deepest block so far
489c9b5090e2 Initial load
duke
parents:
diff changeset
   413
    int    deepb_dom_depth = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   414
    for (int i = 0; i < mem_inputs_length; i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   415
      Block* inb = bbs[mem_inputs[i]->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   416
      if (deepb_dom_depth < (int) inb->_dom_depth) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   417
        // The new inb must be dominated by the previous deepb.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   418
        // The various inputs must be linearly ordered in the dom
489c9b5090e2 Initial load
duke
parents:
diff changeset
   419
        // tree, or else there will not be a unique deepest block.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   420
        DEBUG_ONLY(assert_dom(deepb, inb, load, bbs));
489c9b5090e2 Initial load
duke
parents:
diff changeset
   421
        deepb = inb;                      // Save deepest block
489c9b5090e2 Initial load
duke
parents:
diff changeset
   422
        deepb_dom_depth = deepb->_dom_depth;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   423
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   424
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   425
    early = deepb;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   426
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   427
489c9b5090e2 Initial load
duke
parents:
diff changeset
   428
  return early;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   429
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   430
489c9b5090e2 Initial load
duke
parents:
diff changeset
   431
//--------------------------insert_anti_dependences---------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   432
// A load may need to witness memory that nearby stores can overwrite.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   433
// For each nearby store, either insert an "anti-dependence" edge
489c9b5090e2 Initial load
duke
parents:
diff changeset
   434
// from the load to the store, or else move LCA upward to force the
489c9b5090e2 Initial load
duke
parents:
diff changeset
   435
// load to (eventually) be scheduled in a block above the store.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   436
//
489c9b5090e2 Initial load
duke
parents:
diff changeset
   437
// Do not add edges to stores on distinct control-flow paths;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   438
// only add edges to stores which might interfere.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   439
//
489c9b5090e2 Initial load
duke
parents:
diff changeset
   440
// Return the (updated) LCA.  There will not be any possibly interfering
489c9b5090e2 Initial load
duke
parents:
diff changeset
   441
// store between the load's "early block" and the updated LCA.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   442
// Any stores in the updated LCA will have new precedence edges
489c9b5090e2 Initial load
duke
parents:
diff changeset
   443
// back to the load.  The caller is expected to schedule the load
489c9b5090e2 Initial load
duke
parents:
diff changeset
   444
// in the LCA, in which case the precedence edges will make LCM
489c9b5090e2 Initial load
duke
parents:
diff changeset
   445
// preserve anti-dependences.  The caller may also hoist the load
489c9b5090e2 Initial load
duke
parents:
diff changeset
   446
// above the LCA, if it is not the early block.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   447
Block* PhaseCFG::insert_anti_dependences(Block* LCA, Node* load, bool verify) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   448
  assert(load->needs_anti_dependence_check(), "must be a load of some sort");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   449
  assert(LCA != NULL, "");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   450
  DEBUG_ONLY(Block* LCA_orig = LCA);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   451
489c9b5090e2 Initial load
duke
parents:
diff changeset
   452
  // Compute the alias index.  Loads and stores with different alias indices
489c9b5090e2 Initial load
duke
parents:
diff changeset
   453
  // do not need anti-dependence edges.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   454
  uint load_alias_idx = C->get_alias_index(load->adr_type());
489c9b5090e2 Initial load
duke
parents:
diff changeset
   455
#ifdef ASSERT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   456
  if (load_alias_idx == Compile::AliasIdxBot && C->AliasLevel() > 0 &&
489c9b5090e2 Initial load
duke
parents:
diff changeset
   457
      (PrintOpto || VerifyAliases ||
489c9b5090e2 Initial load
duke
parents:
diff changeset
   458
       PrintMiscellaneous && (WizardMode || Verbose))) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   459
    // Load nodes should not consume all of memory.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   460
    // Reporting a bottom type indicates a bug in adlc.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   461
    // If some particular type of node validly consumes all of memory,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   462
    // sharpen the preceding "if" to exclude it, so we can catch bugs here.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   463
    tty->print_cr("*** Possible Anti-Dependence Bug:  Load consumes all of memory.");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   464
    load->dump(2);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   465
    if (VerifyAliases)  assert(load_alias_idx != Compile::AliasIdxBot, "");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   466
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   467
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
   468
  assert(load_alias_idx || (load->is_Mach() && load->as_Mach()->ideal_Opcode() == Op_StrComp),
489c9b5090e2 Initial load
duke
parents:
diff changeset
   469
         "String compare is only known 'load' that does not conflict with any stores");
2348
4e71ed4c2709 6761600: Use sse 4.2 in intrinsics
cfang
parents: 2340
diff changeset
   470
  assert(load_alias_idx || (load->is_Mach() && load->as_Mach()->ideal_Opcode() == Op_StrEquals),
4e71ed4c2709 6761600: Use sse 4.2 in intrinsics
cfang
parents: 2340
diff changeset
   471
         "String equals is a 'load' that does not conflict with any stores");
4e71ed4c2709 6761600: Use sse 4.2 in intrinsics
cfang
parents: 2340
diff changeset
   472
  assert(load_alias_idx || (load->is_Mach() && load->as_Mach()->ideal_Opcode() == Op_StrIndexOf),
4e71ed4c2709 6761600: Use sse 4.2 in intrinsics
cfang
parents: 2340
diff changeset
   473
         "String indexOf is a 'load' that does not conflict with any stores");
4e71ed4c2709 6761600: Use sse 4.2 in intrinsics
cfang
parents: 2340
diff changeset
   474
  assert(load_alias_idx || (load->is_Mach() && load->as_Mach()->ideal_Opcode() == Op_AryEq),
4e71ed4c2709 6761600: Use sse 4.2 in intrinsics
cfang
parents: 2340
diff changeset
   475
         "Arrays equals is a 'load' that do not conflict with any stores");
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   476
489c9b5090e2 Initial load
duke
parents:
diff changeset
   477
  if (!C->alias_type(load_alias_idx)->is_rewritable()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   478
    // It is impossible to spoil this load by putting stores before it,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   479
    // because we know that the stores will never update the value
489c9b5090e2 Initial load
duke
parents:
diff changeset
   480
    // which 'load' must witness.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   481
    return LCA;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   482
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   483
489c9b5090e2 Initial load
duke
parents:
diff changeset
   484
  node_idx_t load_index = load->_idx;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   485
489c9b5090e2 Initial load
duke
parents:
diff changeset
   486
  // Note the earliest legal placement of 'load', as determined by
489c9b5090e2 Initial load
duke
parents:
diff changeset
   487
  // by the unique point in the dom tree where all memory effects
489c9b5090e2 Initial load
duke
parents:
diff changeset
   488
  // and other inputs are first available.  (Computed by schedule_early.)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   489
  // For normal loads, 'early' is the shallowest place (dom graph wise)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   490
  // to look for anti-deps between this load and any store.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   491
  Block* early = _bbs[load_index];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   492
489c9b5090e2 Initial load
duke
parents:
diff changeset
   493
  // If we are subsuming loads, compute an "early" block that only considers
489c9b5090e2 Initial load
duke
parents:
diff changeset
   494
  // memory or address inputs. This block may be different than the
489c9b5090e2 Initial load
duke
parents:
diff changeset
   495
  // schedule_early block in that it could be at an even shallower depth in the
489c9b5090e2 Initial load
duke
parents:
diff changeset
   496
  // dominator tree, and allow for a broader discovery of anti-dependences.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   497
  if (C->subsume_loads()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   498
    early = memory_early_block(load, early, _bbs);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   499
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   500
489c9b5090e2 Initial load
duke
parents:
diff changeset
   501
  ResourceArea *area = Thread::current()->resource_area();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   502
  Node_List worklist_mem(area);     // prior memory state to store
489c9b5090e2 Initial load
duke
parents:
diff changeset
   503
  Node_List worklist_store(area);   // possible-def to explore
204
154149c3f7ba 6590177: jck60019 test assert(!repeated,"do not walk merges twice")
kvn
parents: 1
diff changeset
   504
  Node_List worklist_visited(area); // visited mergemem nodes
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   505
  Node_List non_early_stores(area); // all relevant stores outside of early
489c9b5090e2 Initial load
duke
parents:
diff changeset
   506
  bool must_raise_LCA = false;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   507
489c9b5090e2 Initial load
duke
parents:
diff changeset
   508
#ifdef TRACK_PHI_INPUTS
489c9b5090e2 Initial load
duke
parents:
diff changeset
   509
  // %%% This extra checking fails because MergeMem nodes are not GVNed.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   510
  // Provide "phi_inputs" to check if every input to a PhiNode is from the
489c9b5090e2 Initial load
duke
parents:
diff changeset
   511
  // original memory state.  This indicates a PhiNode for which should not
489c9b5090e2 Initial load
duke
parents:
diff changeset
   512
  // prevent the load from sinking.  For such a block, set_raise_LCA_mark
489c9b5090e2 Initial load
duke
parents:
diff changeset
   513
  // may be overly conservative.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   514
  // Mechanism: count inputs seen for each Phi encountered in worklist_store.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   515
  DEBUG_ONLY(GrowableArray<uint> phi_inputs(area, C->unique(),0,0));
489c9b5090e2 Initial load
duke
parents:
diff changeset
   516
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
   517
489c9b5090e2 Initial load
duke
parents:
diff changeset
   518
  // 'load' uses some memory state; look for users of the same state.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   519
  // Recurse through MergeMem nodes to the stores that use them.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   520
489c9b5090e2 Initial load
duke
parents:
diff changeset
   521
  // Each of these stores is a possible definition of memory
489c9b5090e2 Initial load
duke
parents:
diff changeset
   522
  // that 'load' needs to use.  We need to force 'load'
489c9b5090e2 Initial load
duke
parents:
diff changeset
   523
  // to occur before each such store.  When the store is in
489c9b5090e2 Initial load
duke
parents:
diff changeset
   524
  // the same block as 'load', we insert an anti-dependence
489c9b5090e2 Initial load
duke
parents:
diff changeset
   525
  // edge load->store.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   526
489c9b5090e2 Initial load
duke
parents:
diff changeset
   527
  // The relevant stores "nearby" the load consist of a tree rooted
489c9b5090e2 Initial load
duke
parents:
diff changeset
   528
  // at initial_mem, with internal nodes of type MergeMem.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   529
  // Therefore, the branches visited by the worklist are of this form:
489c9b5090e2 Initial load
duke
parents:
diff changeset
   530
  //    initial_mem -> (MergeMem ->)* store
489c9b5090e2 Initial load
duke
parents:
diff changeset
   531
  // The anti-dependence constraints apply only to the fringe of this tree.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   532
489c9b5090e2 Initial load
duke
parents:
diff changeset
   533
  Node* initial_mem = load->in(MemNode::Memory);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   534
  worklist_store.push(initial_mem);
204
154149c3f7ba 6590177: jck60019 test assert(!repeated,"do not walk merges twice")
kvn
parents: 1
diff changeset
   535
  worklist_visited.push(initial_mem);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   536
  worklist_mem.push(NULL);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   537
  while (worklist_store.size() > 0) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   538
    // Examine a nearby store to see if it might interfere with our load.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   539
    Node* mem   = worklist_mem.pop();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   540
    Node* store = worklist_store.pop();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   541
    uint op = store->Opcode();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   542
489c9b5090e2 Initial load
duke
parents:
diff changeset
   543
    // MergeMems do not directly have anti-deps.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   544
    // Treat them as internal nodes in a forward tree of memory states,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   545
    // the leaves of which are each a 'possible-def'.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   546
    if (store == initial_mem    // root (exclusive) of tree we are searching
489c9b5090e2 Initial load
duke
parents:
diff changeset
   547
        || op == Op_MergeMem    // internal node of tree we are searching
489c9b5090e2 Initial load
duke
parents:
diff changeset
   548
        ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   549
      mem = store;   // It's not a possibly interfering store.
204
154149c3f7ba 6590177: jck60019 test assert(!repeated,"do not walk merges twice")
kvn
parents: 1
diff changeset
   550
      if (store == initial_mem)
154149c3f7ba 6590177: jck60019 test assert(!repeated,"do not walk merges twice")
kvn
parents: 1
diff changeset
   551
        initial_mem = NULL;  // only process initial memory once
154149c3f7ba 6590177: jck60019 test assert(!repeated,"do not walk merges twice")
kvn
parents: 1
diff changeset
   552
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   553
      for (DUIterator_Fast imax, i = mem->fast_outs(imax); i < imax; i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   554
        store = mem->fast_out(i);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   555
        if (store->is_MergeMem()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   556
          // Be sure we don't get into combinatorial problems.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   557
          // (Allow phis to be repeated; they can merge two relevant states.)
204
154149c3f7ba 6590177: jck60019 test assert(!repeated,"do not walk merges twice")
kvn
parents: 1
diff changeset
   558
          uint j = worklist_visited.size();
154149c3f7ba 6590177: jck60019 test assert(!repeated,"do not walk merges twice")
kvn
parents: 1
diff changeset
   559
          for (; j > 0; j--) {
154149c3f7ba 6590177: jck60019 test assert(!repeated,"do not walk merges twice")
kvn
parents: 1
diff changeset
   560
            if (worklist_visited.at(j-1) == store)  break;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   561
          }
204
154149c3f7ba 6590177: jck60019 test assert(!repeated,"do not walk merges twice")
kvn
parents: 1
diff changeset
   562
          if (j > 0)  continue; // already on work list; do not repeat
154149c3f7ba 6590177: jck60019 test assert(!repeated,"do not walk merges twice")
kvn
parents: 1
diff changeset
   563
          worklist_visited.push(store);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   564
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   565
        worklist_mem.push(mem);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   566
        worklist_store.push(store);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   567
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   568
      continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   569
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   570
489c9b5090e2 Initial load
duke
parents:
diff changeset
   571
    if (op == Op_MachProj || op == Op_Catch)   continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   572
    if (store->needs_anti_dependence_check())  continue;  // not really a store
489c9b5090e2 Initial load
duke
parents:
diff changeset
   573
489c9b5090e2 Initial load
duke
parents:
diff changeset
   574
    // Compute the alias index.  Loads and stores with different alias
489c9b5090e2 Initial load
duke
parents:
diff changeset
   575
    // indices do not need anti-dependence edges.  Wide MemBar's are
489c9b5090e2 Initial load
duke
parents:
diff changeset
   576
    // anti-dependent on everything (except immutable memories).
489c9b5090e2 Initial load
duke
parents:
diff changeset
   577
    const TypePtr* adr_type = store->adr_type();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   578
    if (!C->can_alias(adr_type, load_alias_idx))  continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   579
489c9b5090e2 Initial load
duke
parents:
diff changeset
   580
    // Most slow-path runtime calls do NOT modify Java memory, but
489c9b5090e2 Initial load
duke
parents:
diff changeset
   581
    // they can block and so write Raw memory.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   582
    if (store->is_Mach()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   583
      MachNode* mstore = store->as_Mach();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   584
      if (load_alias_idx != Compile::AliasIdxRaw) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   585
        // Check for call into the runtime using the Java calling
489c9b5090e2 Initial load
duke
parents:
diff changeset
   586
        // convention (and from there into a wrapper); it has no
489c9b5090e2 Initial load
duke
parents:
diff changeset
   587
        // _method.  Can't do this optimization for Native calls because
489c9b5090e2 Initial load
duke
parents:
diff changeset
   588
        // they CAN write to Java memory.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   589
        if (mstore->ideal_Opcode() == Op_CallStaticJava) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   590
          assert(mstore->is_MachSafePoint(), "");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   591
          MachSafePointNode* ms = (MachSafePointNode*) mstore;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   592
          assert(ms->is_MachCallJava(), "");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   593
          MachCallJavaNode* mcj = (MachCallJavaNode*) ms;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   594
          if (mcj->_method == NULL) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   595
            // These runtime calls do not write to Java visible memory
489c9b5090e2 Initial load
duke
parents:
diff changeset
   596
            // (other than Raw) and so do not require anti-dependence edges.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   597
            continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   598
          }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   599
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   600
        // Same for SafePoints: they read/write Raw but only read otherwise.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   601
        // This is basically a workaround for SafePoints only defining control
489c9b5090e2 Initial load
duke
parents:
diff changeset
   602
        // instead of control + memory.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   603
        if (mstore->ideal_Opcode() == Op_SafePoint)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   604
          continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   605
      } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   606
        // Some raw memory, such as the load of "top" at an allocation,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   607
        // can be control dependent on the previous safepoint. See
489c9b5090e2 Initial load
duke
parents:
diff changeset
   608
        // comments in GraphKit::allocate_heap() about control input.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   609
        // Inserting an anti-dep between such a safepoint and a use
489c9b5090e2 Initial load
duke
parents:
diff changeset
   610
        // creates a cycle, and will cause a subsequent failure in
489c9b5090e2 Initial load
duke
parents:
diff changeset
   611
        // local scheduling.  (BugId 4919904)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   612
        // (%%% How can a control input be a safepoint and not a projection??)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   613
        if (mstore->ideal_Opcode() == Op_SafePoint && load->in(0) == mstore)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   614
          continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   615
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   616
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   617
489c9b5090e2 Initial load
duke
parents:
diff changeset
   618
    // Identify a block that the current load must be above,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   619
    // or else observe that 'store' is all the way up in the
489c9b5090e2 Initial load
duke
parents:
diff changeset
   620
    // earliest legal block for 'load'.  In the latter case,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   621
    // immediately insert an anti-dependence edge.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   622
    Block* store_block = _bbs[store->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   623
    assert(store_block != NULL, "unused killing projections skipped above");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   624
489c9b5090e2 Initial load
duke
parents:
diff changeset
   625
    if (store->is_Phi()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   626
      // 'load' uses memory which is one (or more) of the Phi's inputs.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   627
      // It must be scheduled not before the Phi, but rather before
489c9b5090e2 Initial load
duke
parents:
diff changeset
   628
      // each of the relevant Phi inputs.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   629
      //
489c9b5090e2 Initial load
duke
parents:
diff changeset
   630
      // Instead of finding the LCA of all inputs to a Phi that match 'mem',
489c9b5090e2 Initial load
duke
parents:
diff changeset
   631
      // we mark each corresponding predecessor block and do a combined
489c9b5090e2 Initial load
duke
parents:
diff changeset
   632
      // hoisting operation later (raise_LCA_above_marks).
489c9b5090e2 Initial load
duke
parents:
diff changeset
   633
      //
489c9b5090e2 Initial load
duke
parents:
diff changeset
   634
      // Do not assert(store_block != early, "Phi merging memory after access")
489c9b5090e2 Initial load
duke
parents:
diff changeset
   635
      // PhiNode may be at start of block 'early' with backedge to 'early'
489c9b5090e2 Initial load
duke
parents:
diff changeset
   636
      DEBUG_ONLY(bool found_match = false);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   637
      for (uint j = PhiNode::Input, jmax = store->req(); j < jmax; j++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   638
        if (store->in(j) == mem) {   // Found matching input?
489c9b5090e2 Initial load
duke
parents:
diff changeset
   639
          DEBUG_ONLY(found_match = true);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   640
          Block* pred_block = _bbs[store_block->pred(j)->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   641
          if (pred_block != early) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   642
            // If any predecessor of the Phi matches the load's "early block",
489c9b5090e2 Initial load
duke
parents:
diff changeset
   643
            // we do not need a precedence edge between the Phi and 'load'
2131
98f9cef66a34 6810672: Comment typos
twisti
parents: 2127
diff changeset
   644
            // since the load will be forced into a block preceding the Phi.
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   645
            pred_block->set_raise_LCA_mark(load_index);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   646
            assert(!LCA_orig->dominates(pred_block) ||
489c9b5090e2 Initial load
duke
parents:
diff changeset
   647
                   early->dominates(pred_block), "early is high enough");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   648
            must_raise_LCA = true;
2875
549b4d80b29e 6843752: missing code for an anti-dependent Phi in GCM
kvn
parents: 2348
diff changeset
   649
          } else {
549b4d80b29e 6843752: missing code for an anti-dependent Phi in GCM
kvn
parents: 2348
diff changeset
   650
            // anti-dependent upon PHI pinned below 'early', no edge needed
549b4d80b29e 6843752: missing code for an anti-dependent Phi in GCM
kvn
parents: 2348
diff changeset
   651
            LCA = early;             // but can not schedule below 'early'
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   652
          }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   653
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   654
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   655
      assert(found_match, "no worklist bug");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   656
#ifdef TRACK_PHI_INPUTS
489c9b5090e2 Initial load
duke
parents:
diff changeset
   657
#ifdef ASSERT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   658
      // This assert asks about correct handling of PhiNodes, which may not
489c9b5090e2 Initial load
duke
parents:
diff changeset
   659
      // have all input edges directly from 'mem'. See BugId 4621264
489c9b5090e2 Initial load
duke
parents:
diff changeset
   660
      int num_mem_inputs = phi_inputs.at_grow(store->_idx,0) + 1;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   661
      // Increment by exactly one even if there are multiple copies of 'mem'
489c9b5090e2 Initial load
duke
parents:
diff changeset
   662
      // coming into the phi, because we will run this block several times
489c9b5090e2 Initial load
duke
parents:
diff changeset
   663
      // if there are several copies of 'mem'.  (That's how DU iterators work.)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   664
      phi_inputs.at_put(store->_idx, num_mem_inputs);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   665
      assert(PhiNode::Input + num_mem_inputs < store->req(),
489c9b5090e2 Initial load
duke
parents:
diff changeset
   666
             "Expect at least one phi input will not be from original memory state");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   667
#endif //ASSERT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   668
#endif //TRACK_PHI_INPUTS
489c9b5090e2 Initial load
duke
parents:
diff changeset
   669
    } else if (store_block != early) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   670
      // 'store' is between the current LCA and earliest possible block.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   671
      // Label its block, and decide later on how to raise the LCA
489c9b5090e2 Initial load
duke
parents:
diff changeset
   672
      // to include the effect on LCA of this store.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   673
      // If this store's block gets chosen as the raised LCA, we
489c9b5090e2 Initial load
duke
parents:
diff changeset
   674
      // will find him on the non_early_stores list and stick him
489c9b5090e2 Initial load
duke
parents:
diff changeset
   675
      // with a precedence edge.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   676
      // (But, don't bother if LCA is already raised all the way.)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   677
      if (LCA != early) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   678
        store_block->set_raise_LCA_mark(load_index);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   679
        must_raise_LCA = true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   680
        non_early_stores.push(store);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   681
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   682
    } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   683
      // Found a possibly-interfering store in the load's 'early' block.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   684
      // This means 'load' cannot sink at all in the dominator tree.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   685
      // Add an anti-dep edge, and squeeze 'load' into the highest block.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   686
      assert(store != load->in(0), "dependence cycle found");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   687
      if (verify) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   688
        assert(store->find_edge(load) != -1, "missing precedence edge");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   689
      } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   690
        store->add_prec(load);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   691
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   692
      LCA = early;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   693
      // This turns off the process of gathering non_early_stores.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   694
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   695
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   696
  // (Worklist is now empty; all nearby stores have been visited.)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   697
489c9b5090e2 Initial load
duke
parents:
diff changeset
   698
  // Finished if 'load' must be scheduled in its 'early' block.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   699
  // If we found any stores there, they have already been given
489c9b5090e2 Initial load
duke
parents:
diff changeset
   700
  // precedence edges.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   701
  if (LCA == early)  return LCA;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   702
489c9b5090e2 Initial load
duke
parents:
diff changeset
   703
  // We get here only if there are no possibly-interfering stores
489c9b5090e2 Initial load
duke
parents:
diff changeset
   704
  // in the load's 'early' block.  Move LCA up above all predecessors
489c9b5090e2 Initial load
duke
parents:
diff changeset
   705
  // which contain stores we have noted.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   706
  //
489c9b5090e2 Initial load
duke
parents:
diff changeset
   707
  // The raised LCA block can be a home to such interfering stores,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   708
  // but its predecessors must not contain any such stores.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   709
  //
489c9b5090e2 Initial load
duke
parents:
diff changeset
   710
  // The raised LCA will be a lower bound for placing the load,
489c9b5090e2 Initial load
duke
parents:
diff changeset
   711
  // preventing the load from sinking past any block containing
489c9b5090e2 Initial load
duke
parents:
diff changeset
   712
  // a store that may invalidate the memory state required by 'load'.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   713
  if (must_raise_LCA)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   714
    LCA = raise_LCA_above_marks(LCA, load->_idx, early, _bbs);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   715
  if (LCA == early)  return LCA;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   716
489c9b5090e2 Initial load
duke
parents:
diff changeset
   717
  // Insert anti-dependence edges from 'load' to each store
489c9b5090e2 Initial load
duke
parents:
diff changeset
   718
  // in the non-early LCA block.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   719
  // Mine the non_early_stores list for such stores.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   720
  if (LCA->raise_LCA_mark() == load_index) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   721
    while (non_early_stores.size() > 0) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   722
      Node* store = non_early_stores.pop();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   723
      Block* store_block = _bbs[store->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   724
      if (store_block == LCA) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   725
        // add anti_dependence from store to load in its own block
489c9b5090e2 Initial load
duke
parents:
diff changeset
   726
        assert(store != load->in(0), "dependence cycle found");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   727
        if (verify) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   728
          assert(store->find_edge(load) != -1, "missing precedence edge");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   729
        } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   730
          store->add_prec(load);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   731
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   732
      } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   733
        assert(store_block->raise_LCA_mark() == load_index, "block was marked");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   734
        // Any other stores we found must be either inside the new LCA
489c9b5090e2 Initial load
duke
parents:
diff changeset
   735
        // or else outside the original LCA.  In the latter case, they
489c9b5090e2 Initial load
duke
parents:
diff changeset
   736
        // did not interfere with any use of 'load'.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   737
        assert(LCA->dominates(store_block)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   738
               || !LCA_orig->dominates(store_block), "no stray stores");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   739
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   740
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   741
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   742
489c9b5090e2 Initial load
duke
parents:
diff changeset
   743
  // Return the highest block containing stores; any stores
489c9b5090e2 Initial load
duke
parents:
diff changeset
   744
  // within that block have been given anti-dependence edges.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   745
  return LCA;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   746
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   747
489c9b5090e2 Initial load
duke
parents:
diff changeset
   748
// This class is used to iterate backwards over the nodes in the graph.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   749
489c9b5090e2 Initial load
duke
parents:
diff changeset
   750
class Node_Backward_Iterator {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   751
489c9b5090e2 Initial load
duke
parents:
diff changeset
   752
private:
489c9b5090e2 Initial load
duke
parents:
diff changeset
   753
  Node_Backward_Iterator();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   754
489c9b5090e2 Initial load
duke
parents:
diff changeset
   755
public:
489c9b5090e2 Initial load
duke
parents:
diff changeset
   756
  // Constructor for the iterator
489c9b5090e2 Initial load
duke
parents:
diff changeset
   757
  Node_Backward_Iterator(Node *root, VectorSet &visited, Node_List &stack, Block_Array &bbs);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   758
489c9b5090e2 Initial load
duke
parents:
diff changeset
   759
  // Postincrement operator to iterate over the nodes
489c9b5090e2 Initial load
duke
parents:
diff changeset
   760
  Node *next();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   761
489c9b5090e2 Initial load
duke
parents:
diff changeset
   762
private:
489c9b5090e2 Initial load
duke
parents:
diff changeset
   763
  VectorSet   &_visited;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   764
  Node_List   &_stack;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   765
  Block_Array &_bbs;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   766
};
489c9b5090e2 Initial load
duke
parents:
diff changeset
   767
489c9b5090e2 Initial load
duke
parents:
diff changeset
   768
// Constructor for the Node_Backward_Iterator
489c9b5090e2 Initial load
duke
parents:
diff changeset
   769
Node_Backward_Iterator::Node_Backward_Iterator( Node *root, VectorSet &visited, Node_List &stack, Block_Array &bbs )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   770
  : _visited(visited), _stack(stack), _bbs(bbs) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   771
  // The stack should contain exactly the root
489c9b5090e2 Initial load
duke
parents:
diff changeset
   772
  stack.clear();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   773
  stack.push(root);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   774
489c9b5090e2 Initial load
duke
parents:
diff changeset
   775
  // Clear the visited bits
489c9b5090e2 Initial load
duke
parents:
diff changeset
   776
  visited.Clear();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   777
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   778
489c9b5090e2 Initial load
duke
parents:
diff changeset
   779
// Iterator for the Node_Backward_Iterator
489c9b5090e2 Initial load
duke
parents:
diff changeset
   780
Node *Node_Backward_Iterator::next() {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   781
489c9b5090e2 Initial load
duke
parents:
diff changeset
   782
  // If the _stack is empty, then just return NULL: finished.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   783
  if ( !_stack.size() )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   784
    return NULL;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   785
489c9b5090e2 Initial load
duke
parents:
diff changeset
   786
  // '_stack' is emulating a real _stack.  The 'visit-all-users' loop has been
489c9b5090e2 Initial load
duke
parents:
diff changeset
   787
  // made stateless, so I do not need to record the index 'i' on my _stack.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   788
  // Instead I visit all users each time, scanning for unvisited users.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   789
  // I visit unvisited not-anti-dependence users first, then anti-dependent
489c9b5090e2 Initial load
duke
parents:
diff changeset
   790
  // children next.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   791
  Node *self = _stack.pop();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   792
489c9b5090e2 Initial load
duke
parents:
diff changeset
   793
  // I cycle here when I am entering a deeper level of recursion.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   794
  // The key variable 'self' was set prior to jumping here.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   795
  while( 1 ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   796
489c9b5090e2 Initial load
duke
parents:
diff changeset
   797
    _visited.set(self->_idx);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   798
489c9b5090e2 Initial load
duke
parents:
diff changeset
   799
    // Now schedule all uses as late as possible.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   800
    uint src     = self->is_Proj() ? self->in(0)->_idx : self->_idx;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   801
    uint src_rpo = _bbs[src]->_rpo;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   802
489c9b5090e2 Initial load
duke
parents:
diff changeset
   803
    // Schedule all nodes in a post-order visit
489c9b5090e2 Initial load
duke
parents:
diff changeset
   804
    Node *unvisited = NULL;  // Unvisited anti-dependent Node, if any
489c9b5090e2 Initial load
duke
parents:
diff changeset
   805
489c9b5090e2 Initial load
duke
parents:
diff changeset
   806
    // Scan for unvisited nodes
489c9b5090e2 Initial load
duke
parents:
diff changeset
   807
    for (DUIterator_Fast imax, i = self->fast_outs(imax); i < imax; i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   808
      // For all uses, schedule late
489c9b5090e2 Initial load
duke
parents:
diff changeset
   809
      Node* n = self->fast_out(i); // Use
489c9b5090e2 Initial load
duke
parents:
diff changeset
   810
489c9b5090e2 Initial load
duke
parents:
diff changeset
   811
      // Skip already visited children
489c9b5090e2 Initial load
duke
parents:
diff changeset
   812
      if ( _visited.test(n->_idx) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   813
        continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   814
489c9b5090e2 Initial load
duke
parents:
diff changeset
   815
      // do not traverse backward control edges
489c9b5090e2 Initial load
duke
parents:
diff changeset
   816
      Node *use = n->is_Proj() ? n->in(0) : n;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   817
      uint use_rpo = _bbs[use->_idx]->_rpo;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   818
489c9b5090e2 Initial load
duke
parents:
diff changeset
   819
      if ( use_rpo < src_rpo )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   820
        continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   821
489c9b5090e2 Initial load
duke
parents:
diff changeset
   822
      // Phi nodes always precede uses in a basic block
489c9b5090e2 Initial load
duke
parents:
diff changeset
   823
      if ( use_rpo == src_rpo && use->is_Phi() )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   824
        continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   825
489c9b5090e2 Initial load
duke
parents:
diff changeset
   826
      unvisited = n;      // Found unvisited
489c9b5090e2 Initial load
duke
parents:
diff changeset
   827
489c9b5090e2 Initial load
duke
parents:
diff changeset
   828
      // Check for possible-anti-dependent
489c9b5090e2 Initial load
duke
parents:
diff changeset
   829
      if( !n->needs_anti_dependence_check() )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   830
        break;            // Not visited, not anti-dep; schedule it NOW
489c9b5090e2 Initial load
duke
parents:
diff changeset
   831
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   832
489c9b5090e2 Initial load
duke
parents:
diff changeset
   833
    // Did I find an unvisited not-anti-dependent Node?
489c9b5090e2 Initial load
duke
parents:
diff changeset
   834
    if ( !unvisited )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   835
      break;                  // All done with children; post-visit 'self'
489c9b5090e2 Initial load
duke
parents:
diff changeset
   836
489c9b5090e2 Initial load
duke
parents:
diff changeset
   837
    // Visit the unvisited Node.  Contains the obvious push to
489c9b5090e2 Initial load
duke
parents:
diff changeset
   838
    // indicate I'm entering a deeper level of recursion.  I push the
489c9b5090e2 Initial load
duke
parents:
diff changeset
   839
    // old state onto the _stack and set a new state and loop (recurse).
489c9b5090e2 Initial load
duke
parents:
diff changeset
   840
    _stack.push(self);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   841
    self = unvisited;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   842
  } // End recursion loop
489c9b5090e2 Initial load
duke
parents:
diff changeset
   843
489c9b5090e2 Initial load
duke
parents:
diff changeset
   844
  return self;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   845
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   846
489c9b5090e2 Initial load
duke
parents:
diff changeset
   847
//------------------------------ComputeLatenciesBackwards----------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   848
// Compute the latency of all the instructions.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   849
void PhaseCFG::ComputeLatenciesBackwards(VectorSet &visited, Node_List &stack) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   850
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   851
  if (trace_opto_pipelining())
489c9b5090e2 Initial load
duke
parents:
diff changeset
   852
    tty->print("\n#---- ComputeLatenciesBackwards ----\n");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   853
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
   854
489c9b5090e2 Initial load
duke
parents:
diff changeset
   855
  Node_Backward_Iterator iter((Node *)_root, visited, stack, _bbs);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   856
  Node *n;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   857
489c9b5090e2 Initial load
duke
parents:
diff changeset
   858
  // Walk over all the nodes from last to first
489c9b5090e2 Initial load
duke
parents:
diff changeset
   859
  while (n = iter.next()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   860
    // Set the latency for the definitions of this instruction
489c9b5090e2 Initial load
duke
parents:
diff changeset
   861
    partial_latency_of_defs(n);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   862
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   863
} // end ComputeLatenciesBackwards
489c9b5090e2 Initial load
duke
parents:
diff changeset
   864
489c9b5090e2 Initial load
duke
parents:
diff changeset
   865
//------------------------------partial_latency_of_defs------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   866
// Compute the latency impact of this node on all defs.  This computes
489c9b5090e2 Initial load
duke
parents:
diff changeset
   867
// a number that increases as we approach the beginning of the routine.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   868
void PhaseCFG::partial_latency_of_defs(Node *n) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   869
  // Set the latency for this instruction
489c9b5090e2 Initial load
duke
parents:
diff changeset
   870
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   871
  if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   872
    tty->print("# latency_to_inputs: node_latency[%d] = %d for node",
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
   873
               n->_idx, _node_latency->at_grow(n->_idx));
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   874
    dump();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   875
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   876
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
   877
489c9b5090e2 Initial load
duke
parents:
diff changeset
   878
  if (n->is_Proj())
489c9b5090e2 Initial load
duke
parents:
diff changeset
   879
    n = n->in(0);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   880
489c9b5090e2 Initial load
duke
parents:
diff changeset
   881
  if (n->is_Root())
489c9b5090e2 Initial load
duke
parents:
diff changeset
   882
    return;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   883
489c9b5090e2 Initial load
duke
parents:
diff changeset
   884
  uint nlen = n->len();
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
   885
  uint use_latency = _node_latency->at_grow(n->_idx);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   886
  uint use_pre_order = _bbs[n->_idx]->_pre_order;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   887
489c9b5090e2 Initial load
duke
parents:
diff changeset
   888
  for ( uint j=0; j<nlen; j++ ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   889
    Node *def = n->in(j);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   890
489c9b5090e2 Initial load
duke
parents:
diff changeset
   891
    if (!def || def == n)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   892
      continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   893
489c9b5090e2 Initial load
duke
parents:
diff changeset
   894
    // Walk backwards thru projections
489c9b5090e2 Initial load
duke
parents:
diff changeset
   895
    if (def->is_Proj())
489c9b5090e2 Initial load
duke
parents:
diff changeset
   896
      def = def->in(0);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   897
489c9b5090e2 Initial load
duke
parents:
diff changeset
   898
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   899
    if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   900
      tty->print("#    in(%2d): ", j);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   901
      def->dump();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   902
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   903
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
   904
489c9b5090e2 Initial load
duke
parents:
diff changeset
   905
    // If the defining block is not known, assume it is ok
489c9b5090e2 Initial load
duke
parents:
diff changeset
   906
    Block *def_block = _bbs[def->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
   907
    uint def_pre_order = def_block ? def_block->_pre_order : 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   908
489c9b5090e2 Initial load
duke
parents:
diff changeset
   909
    if ( (use_pre_order <  def_pre_order) ||
489c9b5090e2 Initial load
duke
parents:
diff changeset
   910
         (use_pre_order == def_pre_order && n->is_Phi()) )
489c9b5090e2 Initial load
duke
parents:
diff changeset
   911
      continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   912
489c9b5090e2 Initial load
duke
parents:
diff changeset
   913
    uint delta_latency = n->latency(j);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   914
    uint current_latency = delta_latency + use_latency;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   915
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
   916
    if (_node_latency->at_grow(def->_idx) < current_latency) {
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
   917
      _node_latency->at_put_grow(def->_idx, current_latency);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   918
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   919
489c9b5090e2 Initial load
duke
parents:
diff changeset
   920
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   921
    if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   922
      tty->print_cr("#      %d + edge_latency(%d) == %d -> %d, node_latency[%d] = %d",
489c9b5090e2 Initial load
duke
parents:
diff changeset
   923
                    use_latency, j, delta_latency, current_latency, def->_idx,
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
   924
                    _node_latency->at_grow(def->_idx));
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   925
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   926
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
   927
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   928
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   929
489c9b5090e2 Initial load
duke
parents:
diff changeset
   930
//------------------------------latency_from_use-------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   931
// Compute the latency of a specific use
489c9b5090e2 Initial load
duke
parents:
diff changeset
   932
int PhaseCFG::latency_from_use(Node *n, const Node *def, Node *use) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   933
  // If self-reference, return no latency
489c9b5090e2 Initial load
duke
parents:
diff changeset
   934
  if (use == n || use->is_Root())
489c9b5090e2 Initial load
duke
parents:
diff changeset
   935
    return 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   936
489c9b5090e2 Initial load
duke
parents:
diff changeset
   937
  uint def_pre_order = _bbs[def->_idx]->_pre_order;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   938
  uint latency = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   939
489c9b5090e2 Initial load
duke
parents:
diff changeset
   940
  // If the use is not a projection, then it is simple...
489c9b5090e2 Initial load
duke
parents:
diff changeset
   941
  if (!use->is_Proj()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   942
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   943
    if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   944
      tty->print("#    out(): ");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   945
      use->dump();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   946
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   947
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
   948
489c9b5090e2 Initial load
duke
parents:
diff changeset
   949
    uint use_pre_order = _bbs[use->_idx]->_pre_order;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   950
489c9b5090e2 Initial load
duke
parents:
diff changeset
   951
    if (use_pre_order < def_pre_order)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   952
      return 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   953
489c9b5090e2 Initial load
duke
parents:
diff changeset
   954
    if (use_pre_order == def_pre_order && use->is_Phi())
489c9b5090e2 Initial load
duke
parents:
diff changeset
   955
      return 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   956
489c9b5090e2 Initial load
duke
parents:
diff changeset
   957
    uint nlen = use->len();
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
   958
    uint nl = _node_latency->at_grow(use->_idx);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   959
489c9b5090e2 Initial load
duke
parents:
diff changeset
   960
    for ( uint j=0; j<nlen; j++ ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   961
      if (use->in(j) == n) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   962
        // Change this if we want local latencies
489c9b5090e2 Initial load
duke
parents:
diff changeset
   963
        uint ul = use->latency(j);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   964
        uint  l = ul + nl;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   965
        if (latency < l) latency = l;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   966
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   967
        if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   968
          tty->print_cr("#      %d + edge_latency(%d) == %d -> %d, latency = %d",
489c9b5090e2 Initial load
duke
parents:
diff changeset
   969
                        nl, j, ul, l, latency);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   970
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   971
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
   972
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   973
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   974
  } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   975
    // This is a projection, just grab the latency of the use(s)
489c9b5090e2 Initial load
duke
parents:
diff changeset
   976
    for (DUIterator_Fast jmax, j = use->fast_outs(jmax); j < jmax; j++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   977
      uint l = latency_from_use(use, def, use->fast_out(j));
489c9b5090e2 Initial load
duke
parents:
diff changeset
   978
      if (latency < l) latency = l;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   979
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   980
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   981
489c9b5090e2 Initial load
duke
parents:
diff changeset
   982
  return latency;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   983
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   984
489c9b5090e2 Initial load
duke
parents:
diff changeset
   985
//------------------------------latency_from_uses------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
   986
// Compute the latency of this instruction relative to all of it's uses.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   987
// This computes a number that increases as we approach the beginning of the
489c9b5090e2 Initial load
duke
parents:
diff changeset
   988
// routine.
489c9b5090e2 Initial load
duke
parents:
diff changeset
   989
void PhaseCFG::latency_from_uses(Node *n) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   990
  // Set the latency for this instruction
489c9b5090e2 Initial load
duke
parents:
diff changeset
   991
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   992
  if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   993
    tty->print("# latency_from_outputs: node_latency[%d] = %d for node",
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
   994
               n->_idx, _node_latency->at_grow(n->_idx));
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   995
    dump();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   996
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   997
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
   998
  uint latency=0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   999
  const Node *def = n->is_Proj() ? n->in(0): n;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1000
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1001
  for (DUIterator_Fast imax, i = n->fast_outs(imax); i < imax; i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1002
    uint l = latency_from_use(n, def, n->fast_out(i));
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1003
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1004
    if (latency < l) latency = l;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1005
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1006
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
  1007
  _node_latency->at_put_grow(n->_idx, latency);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1008
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1009
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1010
//------------------------------hoist_to_cheaper_block-------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1011
// Pick a block for node self, between early and LCA, that is a cheaper
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1012
// alternative to LCA.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1013
Block* PhaseCFG::hoist_to_cheaper_block(Block* LCA, Block* early, Node* self) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1014
  const double delta = 1+PROB_UNLIKELY_MAG(4);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1015
  Block* least       = LCA;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1016
  double least_freq  = least->_freq;
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
  1017
  uint target        = _node_latency->at_grow(self->_idx);
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
  1018
  uint start_latency = _node_latency->at_grow(LCA->_nodes[0]->_idx);
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
  1019
  uint end_latency   = _node_latency->at_grow(LCA->_nodes[LCA->end_idx()]->_idx);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1020
  bool in_latency    = (target <= start_latency);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1021
  const Block* root_block = _bbs[_root->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1022
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1023
  // Turn off latency scheduling if scheduling is just plain off
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1024
  if (!C->do_scheduling())
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1025
    in_latency = true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1026
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1027
  // Do not hoist (to cover latency) instructions which target a
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1028
  // single register.  Hoisting stretches the live range of the
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1029
  // single register and may force spilling.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1030
  MachNode* mach = self->is_Mach() ? self->as_Mach() : NULL;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1031
  if (mach && mach->out_RegMask().is_bound1() && mach->out_RegMask().is_NotEmpty())
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1032
    in_latency = true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1033
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1034
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1035
  if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1036
    tty->print("# Find cheaper block for latency %d: ",
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
  1037
      _node_latency->at_grow(self->_idx));
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1038
    self->dump();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1039
    tty->print_cr("#   B%d: start latency for [%4d]=%d, end latency for [%4d]=%d, freq=%g",
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1040
      LCA->_pre_order,
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1041
      LCA->_nodes[0]->_idx,
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1042
      start_latency,
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1043
      LCA->_nodes[LCA->end_idx()]->_idx,
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1044
      end_latency,
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1045
      least_freq);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1046
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1047
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1048
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1049
  // Walk up the dominator tree from LCA (Lowest common ancestor) to
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1050
  // the earliest legal location.  Capture the least execution frequency.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1051
  while (LCA != early) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1052
    LCA = LCA->_idom;         // Follow up the dominator tree
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1053
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1054
    if (LCA == NULL) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1055
      // Bailout without retry
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1056
      C->record_method_not_compilable("late schedule failed: LCA == NULL");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1057
      return least;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1058
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1059
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1060
    // Don't hoist machine instructions to the root basic block
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1061
    if (mach && LCA == root_block)
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1062
      break;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1063
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
  1064
    uint start_lat = _node_latency->at_grow(LCA->_nodes[0]->_idx);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1065
    uint end_idx   = LCA->end_idx();
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
  1066
    uint end_lat   = _node_latency->at_grow(LCA->_nodes[end_idx]->_idx);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1067
    double LCA_freq = LCA->_freq;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1068
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1069
    if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1070
      tty->print_cr("#   B%d: start latency for [%4d]=%d, end latency for [%4d]=%d, freq=%g",
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1071
        LCA->_pre_order, LCA->_nodes[0]->_idx, start_lat, end_idx, end_lat, LCA_freq);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1072
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1073
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1074
    if (LCA_freq < least_freq              || // Better Frequency
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1075
        ( !in_latency                   &&    // No block containing latency
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1076
          LCA_freq < least_freq * delta &&    // No worse frequency
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1077
          target >= end_lat             &&    // within latency range
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1078
          !self->is_iteratively_computed() )  // But don't hoist IV increments
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1079
             // because they may end up above other uses of their phi forcing
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1080
             // their result register to be different from their input.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1081
       ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1082
      least = LCA;            // Found cheaper block
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1083
      least_freq = LCA_freq;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1084
      start_latency = start_lat;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1085
      end_latency = end_lat;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1086
      if (target <= start_lat)
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1087
        in_latency = true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1088
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1089
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1090
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1091
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1092
  if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1093
    tty->print_cr("#  Choose block B%d with start latency=%d and freq=%g",
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1094
      least->_pre_order, start_latency, least_freq);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1095
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1096
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1097
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1098
  // See if the latency needs to be updated
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1099
  if (target < end_latency) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1100
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1101
    if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1102
      tty->print_cr("#  Change latency for [%4d] from %d to %d", self->_idx, target, end_latency);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1103
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1104
#endif
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
  1105
    _node_latency->at_put_grow(self->_idx, end_latency);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1106
    partial_latency_of_defs(self);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1107
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1108
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1109
  return least;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1110
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1111
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1112
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1113
//------------------------------schedule_late-----------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1114
// Now schedule all codes as LATE as possible.  This is the LCA in the
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1115
// dominator tree of all USES of a value.  Pick the block with the least
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1116
// loop nesting depth that is lowest in the dominator tree.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1117
extern const char must_clone[];
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1118
void PhaseCFG::schedule_late(VectorSet &visited, Node_List &stack) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1119
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1120
  if (trace_opto_pipelining())
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1121
    tty->print("\n#---- schedule_late ----\n");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1122
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1123
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1124
  Node_Backward_Iterator iter((Node *)_root, visited, stack, _bbs);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1125
  Node *self;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1126
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1127
  // Walk over all the nodes from last to first
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1128
  while (self = iter.next()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1129
    Block* early = _bbs[self->_idx];   // Earliest legal placement
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1130
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1131
    if (self->is_top()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1132
      // Top node goes in bb #2 with other constants.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1133
      // It must be special-cased, because it has no out edges.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1134
      early->add_inst(self);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1135
      continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1136
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1137
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1138
    // No uses, just terminate
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1139
    if (self->outcnt() == 0) {
10255
bab46e6f7661 7069452: Cleanup NodeFlags
kvn
parents: 8921
diff changeset
  1140
      assert(self->is_MachProj(), "sanity");
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1141
      continue;                   // Must be a dead machine projection
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1142
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1143
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1144
    // If node is pinned in the block, then no scheduling can be done.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1145
    if( self->pinned() )          // Pinned in block?
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1146
      continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1147
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1148
    MachNode* mach = self->is_Mach() ? self->as_Mach() : NULL;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1149
    if (mach) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1150
      switch (mach->ideal_Opcode()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1151
      case Op_CreateEx:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1152
        // Don't move exception creation
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1153
        early->add_inst(self);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1154
        continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1155
        break;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1156
      case Op_CheckCastPP:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1157
        // Don't move CheckCastPP nodes away from their input, if the input
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1158
        // is a rawptr (5071820).
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1159
        Node *def = self->in(1);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1160
        if (def != NULL && def->bottom_type()->base() == Type::RawPtr) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1161
          early->add_inst(self);
3186
11ba3d09bd0e 6840775: Multiple JVM crashes seen with 1.6.0_10 through 1.6.0_14
kvn
parents: 2875
diff changeset
  1162
#ifdef ASSERT
11ba3d09bd0e 6840775: Multiple JVM crashes seen with 1.6.0_10 through 1.6.0_14
kvn
parents: 2875
diff changeset
  1163
          _raw_oops.push(def);
11ba3d09bd0e 6840775: Multiple JVM crashes seen with 1.6.0_10 through 1.6.0_14
kvn
parents: 2875
diff changeset
  1164
#endif
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1165
          continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1166
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1167
        break;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1168
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1169
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1170
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1171
    // Gather LCA of all uses
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1172
    Block *LCA = NULL;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1173
    {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1174
      for (DUIterator_Fast imax, i = self->fast_outs(imax); i < imax; i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1175
        // For all uses, find LCA
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1176
        Node* use = self->fast_out(i);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1177
        LCA = raise_LCA_above_use(LCA, use, self, _bbs);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1178
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1179
    }  // (Hide defs of imax, i from rest of block.)
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1180
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1181
    // Place temps in the block of their use.  This isn't a
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1182
    // requirement for correctness but it reduces useless
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1183
    // interference between temps and other nodes.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1184
    if (mach != NULL && mach->is_MachTemp()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1185
      _bbs.map(self->_idx, LCA);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1186
      LCA->add_inst(self);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1187
      continue;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1188
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1189
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1190
    // Check if 'self' could be anti-dependent on memory
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1191
    if (self->needs_anti_dependence_check()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1192
      // Hoist LCA above possible-defs and insert anti-dependences to
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1193
      // defs in new LCA block.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1194
      LCA = insert_anti_dependences(LCA, self);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1195
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1196
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1197
    if (early->_dom_depth > LCA->_dom_depth) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1198
      // Somehow the LCA has moved above the earliest legal point.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1199
      // (One way this can happen is via memory_early_block.)
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1200
      if (C->subsume_loads() == true && !C->failing()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1201
        // Retry with subsume_loads == false
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1202
        // If this is the first failure, the sentinel string will "stick"
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1203
        // to the Compile object, and the C2Compiler will see it and retry.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1204
        C->record_failure(C2Compiler::retry_no_subsuming_loads());
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1205
      } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1206
        // Bailout without retry when (early->_dom_depth > LCA->_dom_depth)
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1207
        C->record_method_not_compilable("late schedule failed: incorrect graph");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1208
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1209
      return;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1210
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1211
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1212
    // If there is no opportunity to hoist, then we're done.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1213
    bool try_to_hoist = (LCA != early);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1214
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1215
    // Must clone guys stay next to use; no hoisting allowed.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1216
    // Also cannot hoist guys that alter memory or are otherwise not
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1217
    // allocatable (hoisting can make a value live longer, leading to
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1218
    // anti and output dependency problems which are normally resolved
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1219
    // by the register allocator giving everyone a different register).
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1220
    if (mach != NULL && must_clone[mach->ideal_Opcode()])
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1221
      try_to_hoist = false;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1222
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1223
    Block* late = NULL;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1224
    if (try_to_hoist) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1225
      // Now find the block with the least execution frequency.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1226
      // Start at the latest schedule and work up to the earliest schedule
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1227
      // in the dominator tree.  Thus the Node will dominate all its uses.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1228
      late = hoist_to_cheaper_block(LCA, early, self);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1229
    } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1230
      // Just use the LCA of the uses.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1231
      late = LCA;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1232
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1233
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1234
    // Put the node into target block
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1235
    schedule_node_into_block(self, late);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1236
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1237
#ifdef ASSERT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1238
    if (self->needs_anti_dependence_check()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1239
      // since precedence edges are only inserted when we're sure they
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1240
      // are needed make sure that after placement in a block we don't
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1241
      // need any new precedence edges.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1242
      verify_anti_dependences(late, self);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1243
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1244
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1245
  } // Loop until all nodes have been visited
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1246
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1247
} // end ScheduleLate
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1248
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1249
//------------------------------GlobalCodeMotion-------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1250
void PhaseCFG::GlobalCodeMotion( Matcher &matcher, uint unique, Node_List &proj_list ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1251
  ResourceMark rm;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1252
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1253
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1254
  if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1255
    tty->print("\n---- Start GlobalCodeMotion ----\n");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1256
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1257
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1258
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1259
  // Initialize the bbs.map for things on the proj_list
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1260
  uint i;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1261
  for( i=0; i < proj_list.size(); i++ )
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1262
    _bbs.map(proj_list[i]->_idx, NULL);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1263
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1264
  // Set the basic block for Nodes pinned into blocks
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1265
  Arena *a = Thread::current()->resource_area();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1266
  VectorSet visited(a);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1267
  schedule_pinned_nodes( visited );
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1268
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1269
  // Find the earliest Block any instruction can be placed in.  Some
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1270
  // instructions are pinned into Blocks.  Unpinned instructions can
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1271
  // appear in last block in which all their inputs occur.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1272
  visited.Clear();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1273
  Node_List stack(a);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1274
  stack.map( (unique >> 1) + 16, NULL); // Pre-grow the list
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1275
  if (!schedule_early(visited, stack)) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1276
    // Bailout without retry
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1277
    C->record_method_not_compilable("early schedule failed");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1278
    return;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1279
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1280
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1281
  // Build Def-Use edges.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1282
  proj_list.push(_root);        // Add real root as another root
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1283
  proj_list.pop();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1284
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1285
  // Compute the latency information (via backwards walk) for all the
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1286
  // instructions in the graph
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
  1287
  _node_latency = new GrowableArray<uint>(); // resource_area allocation
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1288
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1289
  if( C->do_scheduling() )
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1290
    ComputeLatenciesBackwards(visited, stack);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1291
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1292
  // Now schedule all codes as LATE as possible.  This is the LCA in the
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1293
  // dominator tree of all USES of a value.  Pick the block with the least
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1294
  // loop nesting depth that is lowest in the dominator tree.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1295
  // ( visited.Clear() called in schedule_late()->Node_Backward_Iterator() )
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1296
  schedule_late(visited, stack);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1297
  if( C->failing() ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1298
    // schedule_late fails only when graph is incorrect.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1299
    assert(!VerifyGraphEdges, "verification should have failed");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1300
    return;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1301
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1302
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1303
  unique = C->unique();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1304
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1305
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1306
  if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1307
    tty->print("\n---- Detect implicit null checks ----\n");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1308
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1309
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1310
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1311
  // Detect implicit-null-check opportunities.  Basically, find NULL checks
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1312
  // with suitable memory ops nearby.  Use the memory op to do the NULL check.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1313
  // I can generate a memory op if there is not one nearby.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1314
  if (C->is_method_compilation()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1315
    // Don't do it for natives, adapters, or runtime stubs
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1316
    int allowed_reasons = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1317
    // ...and don't do it when there have been too many traps, globally.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1318
    for (int reason = (int)Deoptimization::Reason_none+1;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1319
         reason < Compile::trapHistLength; reason++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1320
      assert(reason < BitsPerInt, "recode bit map");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1321
      if (!C->too_many_traps((Deoptimization::DeoptReason) reason))
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1322
        allowed_reasons |= nth_bit(reason);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1323
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1324
    // By reversing the loop direction we get a very minor gain on mpegaudio.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1325
    // Feel free to revert to a forward loop for clarity.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1326
    // for( int i=0; i < (int)matcher._null_check_tests.size(); i+=2 ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1327
    for( int i= matcher._null_check_tests.size()-2; i>=0; i-=2 ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1328
      Node *proj = matcher._null_check_tests[i  ];
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1329
      Node *val  = matcher._null_check_tests[i+1];
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1330
      _bbs[proj->_idx]->implicit_null_check(this, proj, val, allowed_reasons);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1331
      // The implicit_null_check will only perform the transformation
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1332
      // if the null branch is truly uncommon, *and* it leads to an
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1333
      // uncommon trap.  Combined with the too_many_traps guards
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1334
      // above, this prevents SEGV storms reported in 6366351,
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1335
      // by recompiling offending methods without this optimization.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1336
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1337
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1338
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1339
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1340
  if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1341
    tty->print("\n---- Start Local Scheduling ----\n");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1342
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1343
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1344
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1345
  // Schedule locally.  Right now a simple topological sort.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1346
  // Later, do a real latency aware scheduler.
11567
512b2c76e3b7 7116050: C2/ARM: memory stomping error with DivideMcTests
roland
parents: 11191
diff changeset
  1347
  uint max_idx = C->unique();
512b2c76e3b7 7116050: C2/ARM: memory stomping error with DivideMcTests
roland
parents: 11191
diff changeset
  1348
  GrowableArray<int> ready_cnt(max_idx, max_idx, -1);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1349
  visited.Clear();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1350
  for (i = 0; i < _num_blocks; i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1351
    if (!_blocks[i]->schedule_local(this, matcher, ready_cnt, visited)) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1352
      if (!C->failure_reason_is(C2Compiler::retry_no_subsuming_loads())) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1353
        C->record_method_not_compilable("local schedule failed");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1354
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1355
      return;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1356
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1357
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1358
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1359
  // If we inserted any instructions between a Call and his CatchNode,
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1360
  // clone the instructions on all paths below the Catch.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1361
  for( i=0; i < _num_blocks; i++ )
14623
70c4c1be0a14 7092905: C2: Keep track of the number of dead nodes
bharadwaj
parents: 13963
diff changeset
  1362
    _blocks[i]->call_catch_cleanup(_bbs, C);
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1363
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1364
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1365
  if (trace_opto_pipelining()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1366
    tty->print("\n---- After GlobalCodeMotion ----\n");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1367
    for (uint i = 0; i < _num_blocks; i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1368
      _blocks[i]->dump();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1369
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1370
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1371
#endif
6180
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
  1372
  // Dead.
53c1bf468c81 6973963: SEGV in ciBlock::start_bci() with EA
kvn
parents: 5547
diff changeset
  1373
  _node_latency = (GrowableArray<uint> *)0xdeadbeef;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1374
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1375
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1376
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1377
//------------------------------Estimate_Block_Frequency-----------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1378
// Estimate block frequencies based on IfNode probabilities.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1379
void PhaseCFG::Estimate_Block_Frequency() {
1498
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1380
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1381
  // Force conditional branches leading to uncommon traps to be unlikely,
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1382
  // not because we get to the uncommon_trap with less relative frequency,
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1383
  // but because an uncommon_trap typically causes a deopt, so we only get
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1384
  // there once.
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1385
  if (C->do_freq_based_layout()) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1386
    Block_List worklist;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1387
    Block* root_blk = _blocks[0];
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1388
    for (uint i = 1; i < root_blk->num_preds(); i++) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1389
      Block *pb = _bbs[root_blk->pred(i)->_idx];
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1390
      if (pb->has_uncommon_code()) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1391
        worklist.push(pb);
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1392
      }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1393
    }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1394
    while (worklist.size() > 0) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1395
      Block* uct = worklist.pop();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1396
      if (uct == _broot) continue;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1397
      for (uint i = 1; i < uct->num_preds(); i++) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1398
        Block *pb = _bbs[uct->pred(i)->_idx];
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1399
        if (pb->_num_succs == 1) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1400
          worklist.push(pb);
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1401
        } else if (pb->num_fall_throughs() == 2) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1402
          pb->update_uncommon_branch(uct);
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1403
        }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1404
      }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1405
    }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1406
  }
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1407
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1408
  // Create the loop tree and calculate loop depth.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1409
  _root_loop = create_loop_tree();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1410
  _root_loop->compute_loop_depth(0);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1411
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1412
  // Compute block frequency of each block, relative to a single loop entry.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1413
  _root_loop->compute_freq();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1414
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1415
  // Adjust all frequencies to be relative to a single method entry
1498
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1416
  _root_loop->_freq = 1.0;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1417
  _root_loop->scale_freq();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1418
2340
cb47f8209cd8 6810845: Performance regression in mpegaudio on x64
kvn
parents: 2154
diff changeset
  1419
  // Save outmost loop frequency for LRG frequency threshold
cb47f8209cd8 6810845: Performance regression in mpegaudio on x64
kvn
parents: 2154
diff changeset
  1420
  _outer_loop_freq = _root_loop->outer_loop_freq();
cb47f8209cd8 6810845: Performance regression in mpegaudio on x64
kvn
parents: 2154
diff changeset
  1421
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1422
  // force paths ending at uncommon traps to be infrequent
1498
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1423
  if (!C->do_freq_based_layout()) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1424
    Block_List worklist;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1425
    Block* root_blk = _blocks[0];
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1426
    for (uint i = 1; i < root_blk->num_preds(); i++) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1427
      Block *pb = _bbs[root_blk->pred(i)->_idx];
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1428
      if (pb->has_uncommon_code()) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1429
        worklist.push(pb);
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1430
      }
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1431
    }
1498
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1432
    while (worklist.size() > 0) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1433
      Block* uct = worklist.pop();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1434
      uct->_freq = PROB_MIN;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1435
      for (uint i = 1; i < uct->num_preds(); i++) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1436
        Block *pb = _bbs[uct->pred(i)->_idx];
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1437
        if (pb->_num_succs == 1 && pb->_freq > PROB_MIN) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1438
          worklist.push(pb);
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1439
        }
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1440
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1441
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1442
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1443
2016
c1f73fa547fe 6784930: server jvm fails with assert(!n->is_SpillCopy(),"")
kvn
parents: 1498
diff changeset
  1444
#ifdef ASSERT
c1f73fa547fe 6784930: server jvm fails with assert(!n->is_SpillCopy(),"")
kvn
parents: 1498
diff changeset
  1445
  for (uint i = 0; i < _num_blocks; i++ ) {
c1f73fa547fe 6784930: server jvm fails with assert(!n->is_SpillCopy(),"")
kvn
parents: 1498
diff changeset
  1446
    Block *b = _blocks[i];
2131
98f9cef66a34 6810672: Comment typos
twisti
parents: 2127
diff changeset
  1447
    assert(b->_freq >= MIN_BLOCK_FREQUENCY, "Register Allocator requires meaningful block frequency");
2016
c1f73fa547fe 6784930: server jvm fails with assert(!n->is_SpillCopy(),"")
kvn
parents: 1498
diff changeset
  1448
  }
c1f73fa547fe 6784930: server jvm fails with assert(!n->is_SpillCopy(),"")
kvn
parents: 1498
diff changeset
  1449
#endif
c1f73fa547fe 6784930: server jvm fails with assert(!n->is_SpillCopy(),"")
kvn
parents: 1498
diff changeset
  1450
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1451
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1452
  if (PrintCFGBlockFreq) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1453
    tty->print_cr("CFG Block Frequencies");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1454
    _root_loop->dump_tree();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1455
    if (Verbose) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1456
      tty->print_cr("PhaseCFG dump");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1457
      dump();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1458
      tty->print_cr("Node dump");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1459
      _root->dump(99999);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1460
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1461
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1462
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1463
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1464
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1465
//----------------------------create_loop_tree--------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1466
// Create a loop tree from the CFG
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1467
CFGLoop* PhaseCFG::create_loop_tree() {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1468
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1469
#ifdef ASSERT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1470
  assert( _blocks[0] == _broot, "" );
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1471
  for (uint i = 0; i < _num_blocks; i++ ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1472
    Block *b = _blocks[i];
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1473
    // Check that _loop field are clear...we could clear them if not.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1474
    assert(b->_loop == NULL, "clear _loop expected");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1475
    // Sanity check that the RPO numbering is reflected in the _blocks array.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1476
    // It doesn't have to be for the loop tree to be built, but if it is not,
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1477
    // then the blocks have been reordered since dom graph building...which
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1478
    // may question the RPO numbering
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1479
    assert(b->_rpo == i, "unexpected reverse post order number");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1480
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1481
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1482
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1483
  int idct = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1484
  CFGLoop* root_loop = new CFGLoop(idct++);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1485
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1486
  Block_List worklist;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1487
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1488
  // Assign blocks to loops
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1489
  for(uint i = _num_blocks - 1; i > 0; i-- ) { // skip Root block
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1490
    Block *b = _blocks[i];
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1491
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1492
    if (b->head()->is_Loop()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1493
      Block* loop_head = b;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1494
      assert(loop_head->num_preds() - 1 == 2, "loop must have 2 predecessors");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1495
      Node* tail_n = loop_head->pred(LoopNode::LoopBackControl);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1496
      Block* tail = _bbs[tail_n->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1497
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1498
      // Defensively filter out Loop nodes for non-single-entry loops.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1499
      // For all reasonable loops, the head occurs before the tail in RPO.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1500
      if (i <= tail->_rpo) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1501
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1502
        // The tail and (recursive) predecessors of the tail
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1503
        // are made members of a new loop.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1504
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1505
        assert(worklist.size() == 0, "nonempty worklist");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1506
        CFGLoop* nloop = new CFGLoop(idct++);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1507
        assert(loop_head->_loop == NULL, "just checking");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1508
        loop_head->_loop = nloop;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1509
        // Add to nloop so push_pred() will skip over inner loops
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1510
        nloop->add_member(loop_head);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1511
        nloop->push_pred(loop_head, LoopNode::LoopBackControl, worklist, _bbs);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1512
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1513
        while (worklist.size() > 0) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1514
          Block* member = worklist.pop();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1515
          if (member != loop_head) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1516
            for (uint j = 1; j < member->num_preds(); j++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1517
              nloop->push_pred(member, j, worklist, _bbs);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1518
            }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1519
          }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1520
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1521
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1522
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1523
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1524
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1525
  // Create a member list for each loop consisting
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1526
  // of both blocks and (immediate child) loops.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1527
  for (uint i = 0; i < _num_blocks; i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1528
    Block *b = _blocks[i];
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1529
    CFGLoop* lp = b->_loop;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1530
    if (lp == NULL) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1531
      // Not assigned to a loop. Add it to the method's pseudo loop.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1532
      b->_loop = root_loop;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1533
      lp = root_loop;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1534
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1535
    if (lp == root_loop || b != lp->head()) { // loop heads are already members
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1536
      lp->add_member(b);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1537
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1538
    if (lp != root_loop) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1539
      if (lp->parent() == NULL) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1540
        // Not a nested loop. Make it a child of the method's pseudo loop.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1541
        root_loop->add_nested_loop(lp);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1542
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1543
      if (b == lp->head()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1544
        // Add nested loop to member list of parent loop.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1545
        lp->parent()->add_member(lp);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1546
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1547
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1548
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1549
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1550
  return root_loop;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1551
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1552
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1553
//------------------------------push_pred--------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1554
void CFGLoop::push_pred(Block* blk, int i, Block_List& worklist, Block_Array& node_to_blk) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1555
  Node* pred_n = blk->pred(i);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1556
  Block* pred = node_to_blk[pred_n->_idx];
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1557
  CFGLoop *pred_loop = pred->_loop;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1558
  if (pred_loop == NULL) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1559
    // Filter out blocks for non-single-entry loops.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1560
    // For all reasonable loops, the head occurs before the tail in RPO.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1561
    if (pred->_rpo > head()->_rpo) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1562
      pred->_loop = this;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1563
      worklist.push(pred);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1564
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1565
  } else if (pred_loop != this) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1566
    // Nested loop.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1567
    while (pred_loop->_parent != NULL && pred_loop->_parent != this) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1568
      pred_loop = pred_loop->_parent;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1569
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1570
    // Make pred's loop be a child
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1571
    if (pred_loop->_parent == NULL) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1572
      add_nested_loop(pred_loop);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1573
      // Continue with loop entry predecessor.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1574
      Block* pred_head = pred_loop->head();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1575
      assert(pred_head->num_preds() - 1 == 2, "loop must have 2 predecessors");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1576
      assert(pred_head != head(), "loop head in only one loop");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1577
      push_pred(pred_head, LoopNode::EntryControl, worklist, node_to_blk);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1578
    } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1579
      assert(pred_loop->_parent == this && _parent == NULL, "just checking");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1580
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1581
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1582
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1583
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1584
//------------------------------add_nested_loop--------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1585
// Make cl a child of the current loop in the loop tree.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1586
void CFGLoop::add_nested_loop(CFGLoop* cl) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1587
  assert(_parent == NULL, "no parent yet");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1588
  assert(cl != this, "not my own parent");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1589
  cl->_parent = this;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1590
  CFGLoop* ch = _child;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1591
  if (ch == NULL) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1592
    _child = cl;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1593
  } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1594
    while (ch->_sibling != NULL) { ch = ch->_sibling; }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1595
    ch->_sibling = cl;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1596
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1597
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1598
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1599
//------------------------------compute_loop_depth-----------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1600
// Store the loop depth in each CFGLoop object.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1601
// Recursively walk the children to do the same for them.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1602
void CFGLoop::compute_loop_depth(int depth) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1603
  _depth = depth;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1604
  CFGLoop* ch = _child;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1605
  while (ch != NULL) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1606
    ch->compute_loop_depth(depth + 1);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1607
    ch = ch->_sibling;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1608
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1609
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1610
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1611
//------------------------------compute_freq-----------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1612
// Compute the frequency of each block and loop, relative to a single entry
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1613
// into the dominating loop head.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1614
void CFGLoop::compute_freq() {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1615
  // Bottom up traversal of loop tree (visit inner loops first.)
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1616
  // Set loop head frequency to 1.0, then transitively
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1617
  // compute frequency for all successors in the loop,
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1618
  // as well as for each exit edge.  Inner loops are
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1619
  // treated as single blocks with loop exit targets
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1620
  // as the successor blocks.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1621
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1622
  // Nested loops first
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1623
  CFGLoop* ch = _child;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1624
  while (ch != NULL) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1625
    ch->compute_freq();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1626
    ch = ch->_sibling;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1627
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1628
  assert (_members.length() > 0, "no empty loops");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1629
  Block* hd = head();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1630
  hd->_freq = 1.0f;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1631
  for (int i = 0; i < _members.length(); i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1632
    CFGElement* s = _members.at(i);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1633
    float freq = s->_freq;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1634
    if (s->is_block()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1635
      Block* b = s->as_Block();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1636
      for (uint j = 0; j < b->_num_succs; j++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1637
        Block* sb = b->_succs[j];
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1638
        update_succ_freq(sb, freq * b->succ_prob(j));
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1639
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1640
    } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1641
      CFGLoop* lp = s->as_CFGLoop();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1642
      assert(lp->_parent == this, "immediate child");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1643
      for (int k = 0; k < lp->_exits.length(); k++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1644
        Block* eb = lp->_exits.at(k).get_target();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1645
        float prob = lp->_exits.at(k).get_prob();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1646
        update_succ_freq(eb, freq * prob);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1647
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1648
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1649
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1650
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1651
  // For all loops other than the outer, "method" loop,
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1652
  // sum and normalize the exit probability. The "method" loop
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1653
  // should keep the initial exit probability of 1, so that
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1654
  // inner blocks do not get erroneously scaled.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1655
  if (_depth != 0) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1656
    // Total the exit probabilities for this loop.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1657
    float exits_sum = 0.0f;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1658
    for (int i = 0; i < _exits.length(); i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1659
      exits_sum += _exits.at(i).get_prob();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1660
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1661
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1662
    // Normalize the exit probabilities. Until now, the
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1663
    // probabilities estimate the possibility of exit per
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1664
    // a single loop iteration; afterward, they estimate
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1665
    // the probability of exit per loop entry.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1666
    for (int i = 0; i < _exits.length(); i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1667
      Block* et = _exits.at(i).get_target();
1498
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1668
      float new_prob = 0.0f;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1669
      if (_exits.at(i).get_prob() > 0.0f) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1670
        new_prob = _exits.at(i).get_prob() / exits_sum;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1671
      }
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1672
      BlockProbPair bpp(et, new_prob);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1673
      _exits.at_put(i, bpp);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1674
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1675
1498
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1676
    // Save the total, but guard against unreasonable probability,
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1677
    // as the value is used to estimate the loop trip count.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1678
    // An infinite trip count would blur relative block
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1679
    // frequencies.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1680
    if (exits_sum > 1.0f) exits_sum = 1.0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1681
    if (exits_sum < PROB_MIN) exits_sum = PROB_MIN;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1682
    _exit_prob = exits_sum;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1683
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1684
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1685
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1686
//------------------------------succ_prob-------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1687
// Determine the probability of reaching successor 'i' from the receiver block.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1688
float Block::succ_prob(uint i) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1689
  int eidx = end_idx();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1690
  Node *n = _nodes[eidx];  // Get ending Node
1070
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1691
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1692
  int op = n->Opcode();
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1693
  if (n->is_Mach()) {
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1694
    if (n->is_MachNullCheck()) {
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1695
      // Can only reach here if called after lcm. The original Op_If is gone,
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1696
      // so we attempt to infer the probability from one or both of the
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1697
      // successor blocks.
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1698
      assert(_num_succs == 2, "expecting 2 successors of a null check");
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1699
      // If either successor has only one predecessor, then the
2131
98f9cef66a34 6810672: Comment typos
twisti
parents: 2127
diff changeset
  1700
      // probability estimate can be derived using the
1070
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1701
      // relative frequency of the successor and this block.
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1702
      if (_succs[i]->num_preds() == 2) {
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1703
        return _succs[i]->_freq / _freq;
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1704
      } else if (_succs[1-i]->num_preds() == 2) {
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1705
        return 1 - (_succs[1-i]->_freq / _freq);
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1706
      } else {
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1707
        // Estimate using both successor frequencies
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1708
        float freq = _succs[i]->_freq;
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1709
        return freq / (freq + _succs[1-i]->_freq);
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1710
      }
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1711
    }
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1712
    op = n->as_Mach()->ideal_Opcode();
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1713
  }
e03de091796e 6611837: block frequency is zero
rasbold
parents: 781
diff changeset
  1714
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1715
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1716
  // Switch on branch type
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1717
  switch( op ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1718
  case Op_CountedLoopEnd:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1719
  case Op_If: {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1720
    assert (i < 2, "just checking");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1721
    // Conditionals pass on only part of their frequency
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1722
    float prob  = n->as_MachIf()->_prob;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1723
    assert(prob >= 0.0 && prob <= 1.0, "out of range probability");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1724
    // If succ[i] is the FALSE branch, invert path info
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1725
    if( _nodes[i + eidx + 1]->Opcode() == Op_IfFalse ) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1726
      return 1.0f - prob; // not taken
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1727
    } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1728
      return prob; // taken
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1729
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1730
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1731
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1732
  case Op_Jump:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1733
    // Divide the frequency between all successors evenly
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1734
    return 1.0f/_num_succs;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1735
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1736
  case Op_Catch: {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1737
    const CatchProjNode *ci = _nodes[i + eidx + 1]->as_CatchProj();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1738
    if (ci->_con == CatchProjNode::fall_through_index) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1739
      // Fall-thru path gets the lion's share.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1740
      return 1.0f - PROB_UNLIKELY_MAG(5)*_num_succs;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1741
    } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1742
      // Presume exceptional paths are equally unlikely
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1743
      return PROB_UNLIKELY_MAG(5);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1744
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1745
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1746
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1747
  case Op_Root:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1748
  case Op_Goto:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1749
    // Pass frequency straight thru to target
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1750
    return 1.0f;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1751
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1752
  case Op_NeverBranch:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1753
    return 0.0f;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1754
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1755
  case Op_TailCall:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1756
  case Op_TailJump:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1757
  case Op_Return:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1758
  case Op_Halt:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1759
  case Op_Rethrow:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1760
    // Do not push out freq to root block
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1761
    return 0.0f;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1762
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1763
  default:
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1764
    ShouldNotReachHere();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1765
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1766
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1767
  return 0.0f;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1768
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1769
1498
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1770
//------------------------------num_fall_throughs-----------------------------
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1771
// Return the number of fall-through candidates for a block
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1772
int Block::num_fall_throughs() {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1773
  int eidx = end_idx();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1774
  Node *n = _nodes[eidx];  // Get ending Node
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1775
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1776
  int op = n->Opcode();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1777
  if (n->is_Mach()) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1778
    if (n->is_MachNullCheck()) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1779
      // In theory, either side can fall-thru, for simplicity sake,
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1780
      // let's say only the false branch can now.
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1781
      return 1;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1782
    }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1783
    op = n->as_Mach()->ideal_Opcode();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1784
  }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1785
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1786
  // Switch on branch type
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1787
  switch( op ) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1788
  case Op_CountedLoopEnd:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1789
  case Op_If:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1790
    return 2;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1791
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1792
  case Op_Root:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1793
  case Op_Goto:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1794
    return 1;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1795
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1796
  case Op_Catch: {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1797
    for (uint i = 0; i < _num_succs; i++) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1798
      const CatchProjNode *ci = _nodes[i + eidx + 1]->as_CatchProj();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1799
      if (ci->_con == CatchProjNode::fall_through_index) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1800
        return 1;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1801
      }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1802
    }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1803
    return 0;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1804
  }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1805
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1806
  case Op_Jump:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1807
  case Op_NeverBranch:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1808
  case Op_TailCall:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1809
  case Op_TailJump:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1810
  case Op_Return:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1811
  case Op_Halt:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1812
  case Op_Rethrow:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1813
    return 0;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1814
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1815
  default:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1816
    ShouldNotReachHere();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1817
  }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1818
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1819
  return 0;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1820
}
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1821
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1822
//------------------------------succ_fall_through-----------------------------
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1823
// Return true if a specific successor could be fall-through target.
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1824
bool Block::succ_fall_through(uint i) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1825
  int eidx = end_idx();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1826
  Node *n = _nodes[eidx];  // Get ending Node
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1827
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1828
  int op = n->Opcode();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1829
  if (n->is_Mach()) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1830
    if (n->is_MachNullCheck()) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1831
      // In theory, either side can fall-thru, for simplicity sake,
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1832
      // let's say only the false branch can now.
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1833
      return _nodes[i + eidx + 1]->Opcode() == Op_IfFalse;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1834
    }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1835
    op = n->as_Mach()->ideal_Opcode();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1836
  }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1837
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1838
  // Switch on branch type
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1839
  switch( op ) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1840
  case Op_CountedLoopEnd:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1841
  case Op_If:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1842
  case Op_Root:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1843
  case Op_Goto:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1844
    return true;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1845
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1846
  case Op_Catch: {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1847
    const CatchProjNode *ci = _nodes[i + eidx + 1]->as_CatchProj();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1848
    return ci->_con == CatchProjNode::fall_through_index;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1849
  }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1850
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1851
  case Op_Jump:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1852
  case Op_NeverBranch:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1853
  case Op_TailCall:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1854
  case Op_TailJump:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1855
  case Op_Return:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1856
  case Op_Halt:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1857
  case Op_Rethrow:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1858
    return false;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1859
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1860
  default:
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1861
    ShouldNotReachHere();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1862
  }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1863
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1864
  return false;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1865
}
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1866
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1867
//------------------------------update_uncommon_branch------------------------
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1868
// Update the probability of a two-branch to be uncommon
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1869
void Block::update_uncommon_branch(Block* ub) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1870
  int eidx = end_idx();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1871
  Node *n = _nodes[eidx];  // Get ending Node
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1872
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1873
  int op = n->as_Mach()->ideal_Opcode();
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1874
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1875
  assert(op == Op_CountedLoopEnd || op == Op_If, "must be a If");
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1876
  assert(num_fall_throughs() == 2, "must be a two way branch block");
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1877
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1878
  // Which successor is ub?
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1879
  uint s;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1880
  for (s = 0; s <_num_succs; s++) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1881
    if (_succs[s] == ub) break;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1882
  }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1883
  assert(s < 2, "uncommon successor must be found");
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1884
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1885
  // If ub is the true path, make the proability small, else
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1886
  // ub is the false path, and make the probability large
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1887
  bool invert = (_nodes[s + eidx + 1]->Opcode() == Op_IfFalse);
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1888
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1889
  // Get existing probability
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1890
  float p = n->as_MachIf()->_prob;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1891
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1892
  if (invert) p = 1.0 - p;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1893
  if (p > PROB_MIN) {
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1894
    p = PROB_MIN;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1895
  }
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1896
  if (invert) p = 1.0 - p;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1897
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1898
  n->as_MachIf()->_prob = p;
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1899
}
346bf226078e 6743900: frequency based block layout
rasbold
parents: 1070
diff changeset
  1900
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1901
//------------------------------update_succ_freq-------------------------------
2131
98f9cef66a34 6810672: Comment typos
twisti
parents: 2127
diff changeset
  1902
// Update the appropriate frequency associated with block 'b', a successor of
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1903
// a block in this loop.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1904
void CFGLoop::update_succ_freq(Block* b, float freq) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1905
  if (b->_loop == this) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1906
    if (b == head()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1907
      // back branch within the loop
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1908
      // Do nothing now, the loop carried frequency will be
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1909
      // adjust later in scale_freq().
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1910
    } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1911
      // simple branch within the loop
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1912
      b->_freq += freq;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1913
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1914
  } else if (!in_loop_nest(b)) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1915
    // branch is exit from this loop
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1916
    BlockProbPair bpp(b, freq);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1917
    _exits.append(bpp);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1918
  } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1919
    // branch into nested loop
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1920
    CFGLoop* ch = b->_loop;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1921
    ch->_freq += freq;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1922
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1923
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1924
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1925
//------------------------------in_loop_nest-----------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1926
// Determine if block b is in the receiver's loop nest.
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1927
bool CFGLoop::in_loop_nest(Block* b) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1928
  int depth = _depth;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1929
  CFGLoop* b_loop = b->_loop;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1930
  int b_depth = b_loop->_depth;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1931
  if (depth == b_depth) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1932
    return true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1933
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1934
  while (b_depth > depth) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1935
    b_loop = b_loop->_parent;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1936
    b_depth = b_loop->_depth;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1937
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1938
  return b_loop == this;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1939
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1940
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1941
//------------------------------scale_freq-------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1942
// Scale frequency of loops and blocks by trip counts from outer loops
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1943
// Do a top down traversal of loop tree (visit outer loops first.)
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1944
void CFGLoop::scale_freq() {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1945
  float loop_freq = _freq * trip_count();
2340
cb47f8209cd8 6810845: Performance regression in mpegaudio on x64
kvn
parents: 2154
diff changeset
  1946
  _freq = loop_freq;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1947
  for (int i = 0; i < _members.length(); i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1948
    CFGElement* s = _members.at(i);
2016
c1f73fa547fe 6784930: server jvm fails with assert(!n->is_SpillCopy(),"")
kvn
parents: 1498
diff changeset
  1949
    float block_freq = s->_freq * loop_freq;
2147
9088094e3e81 6812721: Block's frequency should not be NaN
kvn
parents: 2131
diff changeset
  1950
    if (g_isnan(block_freq) || block_freq < MIN_BLOCK_FREQUENCY)
9088094e3e81 6812721: Block's frequency should not be NaN
kvn
parents: 2131
diff changeset
  1951
      block_freq = MIN_BLOCK_FREQUENCY;
2016
c1f73fa547fe 6784930: server jvm fails with assert(!n->is_SpillCopy(),"")
kvn
parents: 1498
diff changeset
  1952
    s->_freq = block_freq;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1953
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1954
  CFGLoop* ch = _child;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1955
  while (ch != NULL) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1956
    ch->scale_freq();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1957
    ch = ch->_sibling;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1958
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1959
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1960
2340
cb47f8209cd8 6810845: Performance regression in mpegaudio on x64
kvn
parents: 2154
diff changeset
  1961
// Frequency of outer loop
cb47f8209cd8 6810845: Performance regression in mpegaudio on x64
kvn
parents: 2154
diff changeset
  1962
float CFGLoop::outer_loop_freq() const {
cb47f8209cd8 6810845: Performance regression in mpegaudio on x64
kvn
parents: 2154
diff changeset
  1963
  if (_child != NULL) {
cb47f8209cd8 6810845: Performance regression in mpegaudio on x64
kvn
parents: 2154
diff changeset
  1964
    return _child->_freq;
cb47f8209cd8 6810845: Performance regression in mpegaudio on x64
kvn
parents: 2154
diff changeset
  1965
  }
cb47f8209cd8 6810845: Performance regression in mpegaudio on x64
kvn
parents: 2154
diff changeset
  1966
  return _freq;
cb47f8209cd8 6810845: Performance regression in mpegaudio on x64
kvn
parents: 2154
diff changeset
  1967
}
cb47f8209cd8 6810845: Performance regression in mpegaudio on x64
kvn
parents: 2154
diff changeset
  1968
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1969
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1970
//------------------------------dump_tree--------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1971
void CFGLoop::dump_tree() const {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1972
  dump();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1973
  if (_child != NULL)   _child->dump_tree();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1974
  if (_sibling != NULL) _sibling->dump_tree();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1975
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1976
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1977
//------------------------------dump-------------------------------------------
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1978
void CFGLoop::dump() const {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1979
  for (int i = 0; i < _depth; i++) tty->print("   ");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1980
  tty->print("%s: %d  trip_count: %6.0f freq: %6.0f\n",
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1981
             _depth == 0 ? "Method" : "Loop", _id, trip_count(), _freq);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1982
  for (int i = 0; i < _depth; i++) tty->print("   ");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1983
  tty->print("         members:", _id);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1984
  int k = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1985
  for (int i = 0; i < _members.length(); i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1986
    if (k++ >= 6) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1987
      tty->print("\n              ");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1988
      for (int j = 0; j < _depth+1; j++) tty->print("   ");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1989
      k = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1990
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1991
    CFGElement *s = _members.at(i);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1992
    if (s->is_block()) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1993
      Block *b = s->as_Block();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1994
      tty->print(" B%d(%6.3f)", b->_pre_order, b->_freq);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1995
    } else {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1996
      CFGLoop* lp = s->as_CFGLoop();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1997
      tty->print(" L%d(%6.3f)", lp->_id, lp->_freq);
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1998
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  1999
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2000
  tty->print("\n");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2001
  for (int i = 0; i < _depth; i++) tty->print("   ");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2002
  tty->print("         exits:  ");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2003
  k = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2004
  for (int i = 0; i < _exits.length(); i++) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2005
    if (k++ >= 7) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2006
      tty->print("\n              ");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2007
      for (int j = 0; j < _depth+1; j++) tty->print("   ");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2008
      k = 0;
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2009
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2010
    Block *blk = _exits.at(i).get_target();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2011
    float prob = _exits.at(i).get_prob();
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2012
    tty->print(" ->%d@%d%%", blk->_pre_order, (int)(prob*100));
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2013
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2014
  tty->print("\n");
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2015
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
  2016
#endif