jdk-sandbox: hotspot/src/share/vm/opto/loopTransform.cpp@489c9b5090e2 (annotated)

1 489c9b5090e2 Initial load duke parents: diff changeset	1	/*
489c9b5090e2 Initial load duke parents: diff changeset	2	* Copyright 2000-2007 Sun Microsystems, Inc. All Rights Reserved.
489c9b5090e2 Initial load duke parents: diff changeset	3	* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
489c9b5090e2 Initial load duke parents: diff changeset	4	*
489c9b5090e2 Initial load duke parents: diff changeset	5	* This code is free software; you can redistribute it and/or modify it
489c9b5090e2 Initial load duke parents: diff changeset	6	* under the terms of the GNU General Public License version 2 only, as
489c9b5090e2 Initial load duke parents: diff changeset	7	* published by the Free Software Foundation.
489c9b5090e2 Initial load duke parents: diff changeset	8	*
489c9b5090e2 Initial load duke parents: diff changeset	9	* This code is distributed in the hope that it will be useful, but WITHOUT
489c9b5090e2 Initial load duke parents: diff changeset	10	* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
489c9b5090e2 Initial load duke parents: diff changeset	11	* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
489c9b5090e2 Initial load duke parents: diff changeset	12	* version 2 for more details (a copy is included in the LICENSE file that
489c9b5090e2 Initial load duke parents: diff changeset	13	* accompanied this code).
489c9b5090e2 Initial load duke parents: diff changeset	14	*
489c9b5090e2 Initial load duke parents: diff changeset	15	* You should have received a copy of the GNU General Public License version
489c9b5090e2 Initial load duke parents: diff changeset	16	* 2 along with this work; if not, write to the Free Software Foundation,
489c9b5090e2 Initial load duke parents: diff changeset	17	* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
489c9b5090e2 Initial load duke parents: diff changeset	18	*
489c9b5090e2 Initial load duke parents: diff changeset	19	* Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
489c9b5090e2 Initial load duke parents: diff changeset	20	* CA 95054 USA or visit www.sun.com if you need additional information or
489c9b5090e2 Initial load duke parents: diff changeset	21	* have any questions.
489c9b5090e2 Initial load duke parents: diff changeset	22	*
489c9b5090e2 Initial load duke parents: diff changeset	23	*/
489c9b5090e2 Initial load duke parents: diff changeset	24
489c9b5090e2 Initial load duke parents: diff changeset	25	#include "incls/_precompiled.incl"
489c9b5090e2 Initial load duke parents: diff changeset	26	#include "incls/_loopTransform.cpp.incl"
489c9b5090e2 Initial load duke parents: diff changeset	27
489c9b5090e2 Initial load duke parents: diff changeset	28	//------------------------------is_loop_exit-----------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	29	// Given an IfNode, return the loop-exiting projection or NULL if both
489c9b5090e2 Initial load duke parents: diff changeset	30	// arms remain in the loop.
489c9b5090e2 Initial load duke parents: diff changeset	31	Node IdealLoopTree::is_loop_exit(Node iff) const {
489c9b5090e2 Initial load duke parents: diff changeset	32	if( iff->outcnt() != 2 ) return NULL; // Ignore partially dead tests
489c9b5090e2 Initial load duke parents: diff changeset	33	PhaseIdealLoop *phase = _phase;
489c9b5090e2 Initial load duke parents: diff changeset	34	// Test is an IfNode, has 2 projections. If BOTH are in the loop
489c9b5090e2 Initial load duke parents: diff changeset	35	// we need loop unswitching instead of peeling.
489c9b5090e2 Initial load duke parents: diff changeset	36	if( !is_member(phase->get_loop( iff->raw_out(0) )) )
489c9b5090e2 Initial load duke parents: diff changeset	37	return iff->raw_out(0);
489c9b5090e2 Initial load duke parents: diff changeset	38	if( !is_member(phase->get_loop( iff->raw_out(1) )) )
489c9b5090e2 Initial load duke parents: diff changeset	39	return iff->raw_out(1);
489c9b5090e2 Initial load duke parents: diff changeset	40	return NULL;
489c9b5090e2 Initial load duke parents: diff changeset	41	}
489c9b5090e2 Initial load duke parents: diff changeset	42
489c9b5090e2 Initial load duke parents: diff changeset	43
489c9b5090e2 Initial load duke parents: diff changeset	44	//=============================================================================
489c9b5090e2 Initial load duke parents: diff changeset	45
489c9b5090e2 Initial load duke parents: diff changeset	46
489c9b5090e2 Initial load duke parents: diff changeset	47	//------------------------------record_for_igvn----------------------------
489c9b5090e2 Initial load duke parents: diff changeset	48	// Put loop body on igvn work list
489c9b5090e2 Initial load duke parents: diff changeset	49	void IdealLoopTree::record_for_igvn() {
489c9b5090e2 Initial load duke parents: diff changeset	50	for( uint i = 0; i < _body.size(); i++ ) {
489c9b5090e2 Initial load duke parents: diff changeset	51	Node *n = _body.at(i);
489c9b5090e2 Initial load duke parents: diff changeset	52	_phase->_igvn._worklist.push(n);
489c9b5090e2 Initial load duke parents: diff changeset	53	}
489c9b5090e2 Initial load duke parents: diff changeset	54	}
489c9b5090e2 Initial load duke parents: diff changeset	55
489c9b5090e2 Initial load duke parents: diff changeset	56	//------------------------------compute_profile_trip_cnt----------------------------
489c9b5090e2 Initial load duke parents: diff changeset	57	// Compute loop trip count from profile data as
489c9b5090e2 Initial load duke parents: diff changeset	58	// (backedge_count + loop_exit_count) / loop_exit_count
489c9b5090e2 Initial load duke parents: diff changeset	59	void IdealLoopTree::compute_profile_trip_cnt( PhaseIdealLoop *phase ) {
489c9b5090e2 Initial load duke parents: diff changeset	60	if (!_head->is_CountedLoop()) {
489c9b5090e2 Initial load duke parents: diff changeset	61	return;
489c9b5090e2 Initial load duke parents: diff changeset	62	}
489c9b5090e2 Initial load duke parents: diff changeset	63	CountedLoopNode* head = _head->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	64	if (head->profile_trip_cnt() != COUNT_UNKNOWN) {
489c9b5090e2 Initial load duke parents: diff changeset	65	return; // Already computed
489c9b5090e2 Initial load duke parents: diff changeset	66	}
489c9b5090e2 Initial load duke parents: diff changeset	67	float trip_cnt = (float)max_jint; // default is big
489c9b5090e2 Initial load duke parents: diff changeset	68
489c9b5090e2 Initial load duke parents: diff changeset	69	Node* back = head->in(LoopNode::LoopBackControl);
489c9b5090e2 Initial load duke parents: diff changeset	70	while (back != head) {
489c9b5090e2 Initial load duke parents: diff changeset	71	if ((back->Opcode() == Op_IfTrue \|\| back->Opcode() == Op_IfFalse) &&
489c9b5090e2 Initial load duke parents: diff changeset	72	back->in(0) &&
489c9b5090e2 Initial load duke parents: diff changeset	73	back->in(0)->is_If() &&
489c9b5090e2 Initial load duke parents: diff changeset	74	back->in(0)->as_If()->_fcnt != COUNT_UNKNOWN &&
489c9b5090e2 Initial load duke parents: diff changeset	75	back->in(0)->as_If()->_prob != PROB_UNKNOWN) {
489c9b5090e2 Initial load duke parents: diff changeset	76	break;
489c9b5090e2 Initial load duke parents: diff changeset	77	}
489c9b5090e2 Initial load duke parents: diff changeset	78	back = phase->idom(back);
489c9b5090e2 Initial load duke parents: diff changeset	79	}
489c9b5090e2 Initial load duke parents: diff changeset	80	if (back != head) {
489c9b5090e2 Initial load duke parents: diff changeset	81	assert((back->Opcode() == Op_IfTrue \|\| back->Opcode() == Op_IfFalse) &&
489c9b5090e2 Initial load duke parents: diff changeset	82	back->in(0), "if-projection exists");
489c9b5090e2 Initial load duke parents: diff changeset	83	IfNode* back_if = back->in(0)->as_If();
489c9b5090e2 Initial load duke parents: diff changeset	84	float loop_back_cnt = back_if->_fcnt * back_if->_prob;
489c9b5090e2 Initial load duke parents: diff changeset	85
489c9b5090e2 Initial load duke parents: diff changeset	86	// Now compute a loop exit count
489c9b5090e2 Initial load duke parents: diff changeset	87	float loop_exit_cnt = 0.0f;
489c9b5090e2 Initial load duke parents: diff changeset	88	for( uint i = 0; i < _body.size(); i++ ) {
489c9b5090e2 Initial load duke parents: diff changeset	89	Node *n = _body[i];
489c9b5090e2 Initial load duke parents: diff changeset	90	if( n->is_If() ) {
489c9b5090e2 Initial load duke parents: diff changeset	91	IfNode *iff = n->as_If();
489c9b5090e2 Initial load duke parents: diff changeset	92	if( iff->_fcnt != COUNT_UNKNOWN && iff->_prob != PROB_UNKNOWN ) {
489c9b5090e2 Initial load duke parents: diff changeset	93	Node *exit = is_loop_exit(iff);
489c9b5090e2 Initial load duke parents: diff changeset	94	if( exit ) {
489c9b5090e2 Initial load duke parents: diff changeset	95	float exit_prob = iff->_prob;
489c9b5090e2 Initial load duke parents: diff changeset	96	if (exit->Opcode() == Op_IfFalse) exit_prob = 1.0 - exit_prob;
489c9b5090e2 Initial load duke parents: diff changeset	97	if (exit_prob > PROB_MIN) {
489c9b5090e2 Initial load duke parents: diff changeset	98	float exit_cnt = iff->_fcnt * exit_prob;
489c9b5090e2 Initial load duke parents: diff changeset	99	loop_exit_cnt += exit_cnt;
489c9b5090e2 Initial load duke parents: diff changeset	100	}
489c9b5090e2 Initial load duke parents: diff changeset	101	}
489c9b5090e2 Initial load duke parents: diff changeset	102	}
489c9b5090e2 Initial load duke parents: diff changeset	103	}
489c9b5090e2 Initial load duke parents: diff changeset	104	}
489c9b5090e2 Initial load duke parents: diff changeset	105	if (loop_exit_cnt > 0.0f) {
489c9b5090e2 Initial load duke parents: diff changeset	106	trip_cnt = (loop_back_cnt + loop_exit_cnt) / loop_exit_cnt;
489c9b5090e2 Initial load duke parents: diff changeset	107	} else {
489c9b5090e2 Initial load duke parents: diff changeset	108	// No exit count so use
489c9b5090e2 Initial load duke parents: diff changeset	109	trip_cnt = loop_back_cnt;
489c9b5090e2 Initial load duke parents: diff changeset	110	}
489c9b5090e2 Initial load duke parents: diff changeset	111	}
489c9b5090e2 Initial load duke parents: diff changeset	112	#ifndef PRODUCT
489c9b5090e2 Initial load duke parents: diff changeset	113	if (TraceProfileTripCount) {
489c9b5090e2 Initial load duke parents: diff changeset	114	tty->print_cr("compute_profile_trip_cnt lp: %d cnt: %f\n", head->_idx, trip_cnt);
489c9b5090e2 Initial load duke parents: diff changeset	115	}
489c9b5090e2 Initial load duke parents: diff changeset	116	#endif
489c9b5090e2 Initial load duke parents: diff changeset	117	head->set_profile_trip_cnt(trip_cnt);
489c9b5090e2 Initial load duke parents: diff changeset	118	}
489c9b5090e2 Initial load duke parents: diff changeset	119
489c9b5090e2 Initial load duke parents: diff changeset	120	//---------------------is_invariant_addition-----------------------------
489c9b5090e2 Initial load duke parents: diff changeset	121	// Return nonzero index of invariant operand for an Add or Sub
489c9b5090e2 Initial load duke parents: diff changeset	122	// of (nonconstant) invariant and variant values. Helper for reassoicate_invariants.
489c9b5090e2 Initial load duke parents: diff changeset	123	int IdealLoopTree::is_invariant_addition(Node* n, PhaseIdealLoop *phase) {
489c9b5090e2 Initial load duke parents: diff changeset	124	int op = n->Opcode();
489c9b5090e2 Initial load duke parents: diff changeset	125	if (op == Op_AddI \|\| op == Op_SubI) {
489c9b5090e2 Initial load duke parents: diff changeset	126	bool in1_invar = this->is_invariant(n->in(1));
489c9b5090e2 Initial load duke parents: diff changeset	127	bool in2_invar = this->is_invariant(n->in(2));
489c9b5090e2 Initial load duke parents: diff changeset	128	if (in1_invar && !in2_invar) return 1;
489c9b5090e2 Initial load duke parents: diff changeset	129	if (!in1_invar && in2_invar) return 2;
489c9b5090e2 Initial load duke parents: diff changeset	130	}
489c9b5090e2 Initial load duke parents: diff changeset	131	return 0;
489c9b5090e2 Initial load duke parents: diff changeset	132	}
489c9b5090e2 Initial load duke parents: diff changeset	133
489c9b5090e2 Initial load duke parents: diff changeset	134	//---------------------reassociate_add_sub-----------------------------
489c9b5090e2 Initial load duke parents: diff changeset	135	// Reassociate invariant add and subtract expressions:
489c9b5090e2 Initial load duke parents: diff changeset	136	//
489c9b5090e2 Initial load duke parents: diff changeset	137	// inv1 + (x + inv2) => ( inv1 + inv2) + x
489c9b5090e2 Initial load duke parents: diff changeset	138	// (x + inv2) + inv1 => ( inv1 + inv2) + x
489c9b5090e2 Initial load duke parents: diff changeset	139	// inv1 + (x - inv2) => ( inv1 - inv2) + x
489c9b5090e2 Initial load duke parents: diff changeset	140	// inv1 - (inv2 - x) => ( inv1 - inv2) + x
489c9b5090e2 Initial load duke parents: diff changeset	141	// (x + inv2) - inv1 => (-inv1 + inv2) + x
489c9b5090e2 Initial load duke parents: diff changeset	142	// (x - inv2) + inv1 => ( inv1 - inv2) + x
489c9b5090e2 Initial load duke parents: diff changeset	143	// (x - inv2) - inv1 => (-inv1 - inv2) + x
489c9b5090e2 Initial load duke parents: diff changeset	144	// inv1 + (inv2 - x) => ( inv1 + inv2) - x
489c9b5090e2 Initial load duke parents: diff changeset	145	// inv1 - (x - inv2) => ( inv1 + inv2) - x
489c9b5090e2 Initial load duke parents: diff changeset	146	// (inv2 - x) + inv1 => ( inv1 + inv2) - x
489c9b5090e2 Initial load duke parents: diff changeset	147	// (inv2 - x) - inv1 => (-inv1 + inv2) - x
489c9b5090e2 Initial load duke parents: diff changeset	148	// inv1 - (x + inv2) => ( inv1 - inv2) - x
489c9b5090e2 Initial load duke parents: diff changeset	149	//
489c9b5090e2 Initial load duke parents: diff changeset	150	Node* IdealLoopTree::reassociate_add_sub(Node* n1, PhaseIdealLoop *phase) {
489c9b5090e2 Initial load duke parents: diff changeset	151	if (!n1->is_Add() && !n1->is_Sub() \|\| n1->outcnt() == 0) return NULL;
489c9b5090e2 Initial load duke parents: diff changeset	152	if (is_invariant(n1)) return NULL;
489c9b5090e2 Initial load duke parents: diff changeset	153	int inv1_idx = is_invariant_addition(n1, phase);
489c9b5090e2 Initial load duke parents: diff changeset	154	if (!inv1_idx) return NULL;
489c9b5090e2 Initial load duke parents: diff changeset	155	// Don't mess with add of constant (igvn moves them to expression tree root.)
489c9b5090e2 Initial load duke parents: diff changeset	156	if (n1->is_Add() && n1->in(2)->is_Con()) return NULL;
489c9b5090e2 Initial load duke parents: diff changeset	157	Node* inv1 = n1->in(inv1_idx);
489c9b5090e2 Initial load duke parents: diff changeset	158	Node* n2 = n1->in(3 - inv1_idx);
489c9b5090e2 Initial load duke parents: diff changeset	159	int inv2_idx = is_invariant_addition(n2, phase);
489c9b5090e2 Initial load duke parents: diff changeset	160	if (!inv2_idx) return NULL;
489c9b5090e2 Initial load duke parents: diff changeset	161	Node* x = n2->in(3 - inv2_idx);
489c9b5090e2 Initial load duke parents: diff changeset	162	Node* inv2 = n2->in(inv2_idx);
489c9b5090e2 Initial load duke parents: diff changeset	163
489c9b5090e2 Initial load duke parents: diff changeset	164	bool neg_x = n2->is_Sub() && inv2_idx == 1;
489c9b5090e2 Initial load duke parents: diff changeset	165	bool neg_inv2 = n2->is_Sub() && inv2_idx == 2;
489c9b5090e2 Initial load duke parents: diff changeset	166	bool neg_inv1 = n1->is_Sub() && inv1_idx == 2;
489c9b5090e2 Initial load duke parents: diff changeset	167	if (n1->is_Sub() && inv1_idx == 1) {
489c9b5090e2 Initial load duke parents: diff changeset	168	neg_x = !neg_x;
489c9b5090e2 Initial load duke parents: diff changeset	169	neg_inv2 = !neg_inv2;
489c9b5090e2 Initial load duke parents: diff changeset	170	}
489c9b5090e2 Initial load duke parents: diff changeset	171	Node* inv1_c = phase->get_ctrl(inv1);
489c9b5090e2 Initial load duke parents: diff changeset	172	Node* inv2_c = phase->get_ctrl(inv2);
489c9b5090e2 Initial load duke parents: diff changeset	173	Node* n_inv1;
489c9b5090e2 Initial load duke parents: diff changeset	174	if (neg_inv1) {
489c9b5090e2 Initial load duke parents: diff changeset	175	Node *zero = phase->_igvn.intcon(0);
489c9b5090e2 Initial load duke parents: diff changeset	176	phase->set_ctrl(zero, phase->C->root());
489c9b5090e2 Initial load duke parents: diff changeset	177	n_inv1 = new (phase->C, 3) SubINode(zero, inv1);
489c9b5090e2 Initial load duke parents: diff changeset	178	phase->register_new_node(n_inv1, inv1_c);
489c9b5090e2 Initial load duke parents: diff changeset	179	} else {
489c9b5090e2 Initial load duke parents: diff changeset	180	n_inv1 = inv1;
489c9b5090e2 Initial load duke parents: diff changeset	181	}
489c9b5090e2 Initial load duke parents: diff changeset	182	Node* inv;
489c9b5090e2 Initial load duke parents: diff changeset	183	if (neg_inv2) {
489c9b5090e2 Initial load duke parents: diff changeset	184	inv = new (phase->C, 3) SubINode(n_inv1, inv2);
489c9b5090e2 Initial load duke parents: diff changeset	185	} else {
489c9b5090e2 Initial load duke parents: diff changeset	186	inv = new (phase->C, 3) AddINode(n_inv1, inv2);
489c9b5090e2 Initial load duke parents: diff changeset	187	}
489c9b5090e2 Initial load duke parents: diff changeset	188	phase->register_new_node(inv, phase->get_early_ctrl(inv));
489c9b5090e2 Initial load duke parents: diff changeset	189
489c9b5090e2 Initial load duke parents: diff changeset	190	Node* addx;
489c9b5090e2 Initial load duke parents: diff changeset	191	if (neg_x) {
489c9b5090e2 Initial load duke parents: diff changeset	192	addx = new (phase->C, 3) SubINode(inv, x);
489c9b5090e2 Initial load duke parents: diff changeset	193	} else {
489c9b5090e2 Initial load duke parents: diff changeset	194	addx = new (phase->C, 3) AddINode(x, inv);
489c9b5090e2 Initial load duke parents: diff changeset	195	}
489c9b5090e2 Initial load duke parents: diff changeset	196	phase->register_new_node(addx, phase->get_ctrl(x));
489c9b5090e2 Initial load duke parents: diff changeset	197	phase->_igvn.hash_delete(n1);
489c9b5090e2 Initial load duke parents: diff changeset	198	phase->_igvn.subsume_node(n1, addx);
489c9b5090e2 Initial load duke parents: diff changeset	199	return addx;
489c9b5090e2 Initial load duke parents: diff changeset	200	}
489c9b5090e2 Initial load duke parents: diff changeset	201
489c9b5090e2 Initial load duke parents: diff changeset	202	//---------------------reassociate_invariants-----------------------------
489c9b5090e2 Initial load duke parents: diff changeset	203	// Reassociate invariant expressions:
489c9b5090e2 Initial load duke parents: diff changeset	204	void IdealLoopTree::reassociate_invariants(PhaseIdealLoop *phase) {
489c9b5090e2 Initial load duke parents: diff changeset	205	for (int i = _body.size() - 1; i >= 0; i--) {
489c9b5090e2 Initial load duke parents: diff changeset	206	Node *n = _body.at(i);
489c9b5090e2 Initial load duke parents: diff changeset	207	for (int j = 0; j < 5; j++) {
489c9b5090e2 Initial load duke parents: diff changeset	208	Node* nn = reassociate_add_sub(n, phase);
489c9b5090e2 Initial load duke parents: diff changeset	209	if (nn == NULL) break;
489c9b5090e2 Initial load duke parents: diff changeset	210	n = nn; // again
489c9b5090e2 Initial load duke parents: diff changeset	211	};
489c9b5090e2 Initial load duke parents: diff changeset	212	}
489c9b5090e2 Initial load duke parents: diff changeset	213	}
489c9b5090e2 Initial load duke parents: diff changeset	214
489c9b5090e2 Initial load duke parents: diff changeset	215	//------------------------------policy_peeling---------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	216	// Return TRUE or FALSE if the loop should be peeled or not. Peel if we can
489c9b5090e2 Initial load duke parents: diff changeset	217	// make some loop-invariant test (usually a null-check) happen before the loop.
489c9b5090e2 Initial load duke parents: diff changeset	218	bool IdealLoopTree::policy_peeling( PhaseIdealLoop *phase ) const {
489c9b5090e2 Initial load duke parents: diff changeset	219	Node test = ((IdealLoopTree)this)->tail();
489c9b5090e2 Initial load duke parents: diff changeset	220	int body_size = ((IdealLoopTree*)this)->_body.size();
489c9b5090e2 Initial load duke parents: diff changeset	221	int uniq = phase->C->unique();
489c9b5090e2 Initial load duke parents: diff changeset	222	// Peeling does loop cloning which can result in O(N^2) node construction
489c9b5090e2 Initial load duke parents: diff changeset	223	if( body_size > 255 /* Prevent overflow for large body_size */
489c9b5090e2 Initial load duke parents: diff changeset	224	\|\| (body_size * body_size + uniq > MaxNodeLimit) ) {
489c9b5090e2 Initial load duke parents: diff changeset	225	return false; // too large to safely clone
489c9b5090e2 Initial load duke parents: diff changeset	226	}
489c9b5090e2 Initial load duke parents: diff changeset	227	while( test != _head ) { // Scan till run off top of loop
489c9b5090e2 Initial load duke parents: diff changeset	228	if( test->is_If() ) { // Test?
489c9b5090e2 Initial load duke parents: diff changeset	229	Node *ctrl = phase->get_ctrl(test->in(1));
489c9b5090e2 Initial load duke parents: diff changeset	230	if (ctrl->is_top())
489c9b5090e2 Initial load duke parents: diff changeset	231	return false; // Found dead test on live IF? No peeling!
489c9b5090e2 Initial load duke parents: diff changeset	232	// Standard IF only has one input value to check for loop invariance
489c9b5090e2 Initial load duke parents: diff changeset	233	assert( test->Opcode() == Op_If \|\| test->Opcode() == Op_CountedLoopEnd, "Check this code when new subtype is added");
489c9b5090e2 Initial load duke parents: diff changeset	234	// Condition is not a member of this loop?
489c9b5090e2 Initial load duke parents: diff changeset	235	if( !is_member(phase->get_loop(ctrl)) &&
489c9b5090e2 Initial load duke parents: diff changeset	236	is_loop_exit(test) )
489c9b5090e2 Initial load duke parents: diff changeset	237	return true; // Found reason to peel!
489c9b5090e2 Initial load duke parents: diff changeset	238	}
489c9b5090e2 Initial load duke parents: diff changeset	239	// Walk up dominators to loop _head looking for test which is
489c9b5090e2 Initial load duke parents: diff changeset	240	// executed on every path thru loop.
489c9b5090e2 Initial load duke parents: diff changeset	241	test = phase->idom(test);
489c9b5090e2 Initial load duke parents: diff changeset	242	}
489c9b5090e2 Initial load duke parents: diff changeset	243	return false;
489c9b5090e2 Initial load duke parents: diff changeset	244	}
489c9b5090e2 Initial load duke parents: diff changeset	245
489c9b5090e2 Initial load duke parents: diff changeset	246	//------------------------------peeled_dom_test_elim---------------------------
489c9b5090e2 Initial load duke parents: diff changeset	247	// If we got the effect of peeling, either by actually peeling or by making
489c9b5090e2 Initial load duke parents: diff changeset	248	// a pre-loop which must execute at least once, we can remove all
489c9b5090e2 Initial load duke parents: diff changeset	249	// loop-invariant dominated tests in the main body.
489c9b5090e2 Initial load duke parents: diff changeset	250	void PhaseIdealLoop::peeled_dom_test_elim( IdealLoopTree *loop, Node_List &old_new ) {
489c9b5090e2 Initial load duke parents: diff changeset	251	bool progress = true;
489c9b5090e2 Initial load duke parents: diff changeset	252	while( progress ) {
489c9b5090e2 Initial load duke parents: diff changeset	253	progress = false; // Reset for next iteration
489c9b5090e2 Initial load duke parents: diff changeset	254	Node *prev = loop->_head->in(LoopNode::LoopBackControl);//loop->tail();
489c9b5090e2 Initial load duke parents: diff changeset	255	Node *test = prev->in(0);
489c9b5090e2 Initial load duke parents: diff changeset	256	while( test != loop->_head ) { // Scan till run off top of loop
489c9b5090e2 Initial load duke parents: diff changeset	257
489c9b5090e2 Initial load duke parents: diff changeset	258	int p_op = prev->Opcode();
489c9b5090e2 Initial load duke parents: diff changeset	259	if( (p_op == Op_IfFalse \|\| p_op == Op_IfTrue) &&
489c9b5090e2 Initial load duke parents: diff changeset	260	test->is_If() && // Test?
489c9b5090e2 Initial load duke parents: diff changeset	261	!test->in(1)->is_Con() && // And not already obvious?
489c9b5090e2 Initial load duke parents: diff changeset	262	// Condition is not a member of this loop?
489c9b5090e2 Initial load duke parents: diff changeset	263	!loop->is_member(get_loop(get_ctrl(test->in(1))))){
489c9b5090e2 Initial load duke parents: diff changeset	264	// Walk loop body looking for instances of this test
489c9b5090e2 Initial load duke parents: diff changeset	265	for( uint i = 0; i < loop->_body.size(); i++ ) {
489c9b5090e2 Initial load duke parents: diff changeset	266	Node *n = loop->_body.at(i);
489c9b5090e2 Initial load duke parents: diff changeset	267	if( n->is_If() && n->in(1) == test->in(1) /&& n != loop->tail()->in(0)/ ) {
489c9b5090e2 Initial load duke parents: diff changeset	268	// IfNode was dominated by version in peeled loop body
489c9b5090e2 Initial load duke parents: diff changeset	269	progress = true;
489c9b5090e2 Initial load duke parents: diff changeset	270	dominated_by( old_new[prev->_idx], n );
489c9b5090e2 Initial load duke parents: diff changeset	271	}
489c9b5090e2 Initial load duke parents: diff changeset	272	}
489c9b5090e2 Initial load duke parents: diff changeset	273	}
489c9b5090e2 Initial load duke parents: diff changeset	274	prev = test;
489c9b5090e2 Initial load duke parents: diff changeset	275	test = idom(test);
489c9b5090e2 Initial load duke parents: diff changeset	276	} // End of scan tests in loop
489c9b5090e2 Initial load duke parents: diff changeset	277
489c9b5090e2 Initial load duke parents: diff changeset	278	} // End of while( progress )
489c9b5090e2 Initial load duke parents: diff changeset	279	}
489c9b5090e2 Initial load duke parents: diff changeset	280
489c9b5090e2 Initial load duke parents: diff changeset	281	//------------------------------do_peeling-------------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	282	// Peel the first iteration of the given loop.
489c9b5090e2 Initial load duke parents: diff changeset	283	// Step 1: Clone the loop body. The clone becomes the peeled iteration.
489c9b5090e2 Initial load duke parents: diff changeset	284	// The pre-loop illegally has 2 control users (old & new loops).
489c9b5090e2 Initial load duke parents: diff changeset	285	// Step 2: Make the old-loop fall-in edges point to the peeled iteration.
489c9b5090e2 Initial load duke parents: diff changeset	286	// Do this by making the old-loop fall-in edges act as if they came
489c9b5090e2 Initial load duke parents: diff changeset	287	// around the loopback from the prior iteration (follow the old-loop
489c9b5090e2 Initial load duke parents: diff changeset	288	// backedges) and then map to the new peeled iteration. This leaves
489c9b5090e2 Initial load duke parents: diff changeset	289	// the pre-loop with only 1 user (the new peeled iteration), but the
489c9b5090e2 Initial load duke parents: diff changeset	290	// peeled-loop backedge has 2 users.
489c9b5090e2 Initial load duke parents: diff changeset	291	// Step 3: Cut the backedge on the clone (so it's not a loop) and remove the
489c9b5090e2 Initial load duke parents: diff changeset	292	// extra backedge user.
489c9b5090e2 Initial load duke parents: diff changeset	293	void PhaseIdealLoop::do_peeling( IdealLoopTree *loop, Node_List &old_new ) {
489c9b5090e2 Initial load duke parents: diff changeset	294
489c9b5090e2 Initial load duke parents: diff changeset	295	C->set_major_progress();
489c9b5090e2 Initial load duke parents: diff changeset	296	// Peeling a 'main' loop in a pre/main/post situation obfuscates the
489c9b5090e2 Initial load duke parents: diff changeset	297	// 'pre' loop from the main and the 'pre' can no longer have it's
489c9b5090e2 Initial load duke parents: diff changeset	298	// iterations adjusted. Therefore, we need to declare this loop as
489c9b5090e2 Initial load duke parents: diff changeset	299	// no longer a 'main' loop; it will need new pre and post loops before
489c9b5090e2 Initial load duke parents: diff changeset	300	// we can do further RCE.
489c9b5090e2 Initial load duke parents: diff changeset	301	Node *h = loop->_head;
489c9b5090e2 Initial load duke parents: diff changeset	302	if( h->is_CountedLoop() ) {
489c9b5090e2 Initial load duke parents: diff changeset	303	CountedLoopNode *cl = h->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	304	assert(cl->trip_count() > 0, "peeling a fully unrolled loop");
489c9b5090e2 Initial load duke parents: diff changeset	305	cl->set_trip_count(cl->trip_count() - 1);
489c9b5090e2 Initial load duke parents: diff changeset	306	if( cl->is_main_loop() ) {
489c9b5090e2 Initial load duke parents: diff changeset	307	cl->set_normal_loop();
489c9b5090e2 Initial load duke parents: diff changeset	308	#ifndef PRODUCT
489c9b5090e2 Initial load duke parents: diff changeset	309	if( PrintOpto && VerifyLoopOptimizations ) {
489c9b5090e2 Initial load duke parents: diff changeset	310	tty->print("Peeling a 'main' loop; resetting to 'normal' ");
489c9b5090e2 Initial load duke parents: diff changeset	311	loop->dump_head();
489c9b5090e2 Initial load duke parents: diff changeset	312	}
489c9b5090e2 Initial load duke parents: diff changeset	313	#endif
489c9b5090e2 Initial load duke parents: diff changeset	314	}
489c9b5090e2 Initial load duke parents: diff changeset	315	}
489c9b5090e2 Initial load duke parents: diff changeset	316
489c9b5090e2 Initial load duke parents: diff changeset	317	// Step 1: Clone the loop body. The clone becomes the peeled iteration.
489c9b5090e2 Initial load duke parents: diff changeset	318	// The pre-loop illegally has 2 control users (old & new loops).
489c9b5090e2 Initial load duke parents: diff changeset	319	clone_loop( loop, old_new, dom_depth(loop->_head) );
489c9b5090e2 Initial load duke parents: diff changeset	320
489c9b5090e2 Initial load duke parents: diff changeset	321
489c9b5090e2 Initial load duke parents: diff changeset	322	// Step 2: Make the old-loop fall-in edges point to the peeled iteration.
489c9b5090e2 Initial load duke parents: diff changeset	323	// Do this by making the old-loop fall-in edges act as if they came
489c9b5090e2 Initial load duke parents: diff changeset	324	// around the loopback from the prior iteration (follow the old-loop
489c9b5090e2 Initial load duke parents: diff changeset	325	// backedges) and then map to the new peeled iteration. This leaves
489c9b5090e2 Initial load duke parents: diff changeset	326	// the pre-loop with only 1 user (the new peeled iteration), but the
489c9b5090e2 Initial load duke parents: diff changeset	327	// peeled-loop backedge has 2 users.
489c9b5090e2 Initial load duke parents: diff changeset	328	for (DUIterator_Fast jmax, j = loop->_head->fast_outs(jmax); j < jmax; j++) {
489c9b5090e2 Initial load duke parents: diff changeset	329	Node* old = loop->_head->fast_out(j);
489c9b5090e2 Initial load duke parents: diff changeset	330	if( old->in(0) == loop->_head && old->req() == 3 &&
489c9b5090e2 Initial load duke parents: diff changeset	331	(old->is_Loop() \|\| old->is_Phi()) ) {
489c9b5090e2 Initial load duke parents: diff changeset	332	Node *new_exit_value = old_new[old->in(LoopNode::LoopBackControl)->_idx];
489c9b5090e2 Initial load duke parents: diff changeset	333	if( !new_exit_value ) // Backedge value is ALSO loop invariant?
489c9b5090e2 Initial load duke parents: diff changeset	334	// Then loop body backedge value remains the same.
489c9b5090e2 Initial load duke parents: diff changeset	335	new_exit_value = old->in(LoopNode::LoopBackControl);
489c9b5090e2 Initial load duke parents: diff changeset	336	_igvn.hash_delete(old);
489c9b5090e2 Initial load duke parents: diff changeset	337	old->set_req(LoopNode::EntryControl, new_exit_value);
489c9b5090e2 Initial load duke parents: diff changeset	338	}
489c9b5090e2 Initial load duke parents: diff changeset	339	}
489c9b5090e2 Initial load duke parents: diff changeset	340
489c9b5090e2 Initial load duke parents: diff changeset	341
489c9b5090e2 Initial load duke parents: diff changeset	342	// Step 3: Cut the backedge on the clone (so its not a loop) and remove the
489c9b5090e2 Initial load duke parents: diff changeset	343	// extra backedge user.
489c9b5090e2 Initial load duke parents: diff changeset	344	Node *nnn = old_new[loop->_head->_idx];
489c9b5090e2 Initial load duke parents: diff changeset	345	_igvn.hash_delete(nnn);
489c9b5090e2 Initial load duke parents: diff changeset	346	nnn->set_req(LoopNode::LoopBackControl, C->top());
489c9b5090e2 Initial load duke parents: diff changeset	347	for (DUIterator_Fast j2max, j2 = nnn->fast_outs(j2max); j2 < j2max; j2++) {
489c9b5090e2 Initial load duke parents: diff changeset	348	Node* use = nnn->fast_out(j2);
489c9b5090e2 Initial load duke parents: diff changeset	349	if( use->in(0) == nnn && use->req() == 3 && use->is_Phi() ) {
489c9b5090e2 Initial load duke parents: diff changeset	350	_igvn.hash_delete(use);
489c9b5090e2 Initial load duke parents: diff changeset	351	use->set_req(LoopNode::LoopBackControl, C->top());
489c9b5090e2 Initial load duke parents: diff changeset	352	}
489c9b5090e2 Initial load duke parents: diff changeset	353	}
489c9b5090e2 Initial load duke parents: diff changeset	354
489c9b5090e2 Initial load duke parents: diff changeset	355
489c9b5090e2 Initial load duke parents: diff changeset	356	// Step 4: Correct dom-depth info. Set to loop-head depth.
489c9b5090e2 Initial load duke parents: diff changeset	357	int dd = dom_depth(loop->_head);
489c9b5090e2 Initial load duke parents: diff changeset	358	set_idom(loop->_head, loop->_head->in(1), dd);
489c9b5090e2 Initial load duke parents: diff changeset	359	for (uint j3 = 0; j3 < loop->_body.size(); j3++) {
489c9b5090e2 Initial load duke parents: diff changeset	360	Node *old = loop->_body.at(j3);
489c9b5090e2 Initial load duke parents: diff changeset	361	Node *nnn = old_new[old->_idx];
489c9b5090e2 Initial load duke parents: diff changeset	362	if (!has_ctrl(nnn))
489c9b5090e2 Initial load duke parents: diff changeset	363	set_idom(nnn, idom(nnn), dd-1);
489c9b5090e2 Initial load duke parents: diff changeset	364	// While we're at it, remove any SafePoints from the peeled code
489c9b5090e2 Initial load duke parents: diff changeset	365	if( old->Opcode() == Op_SafePoint ) {
489c9b5090e2 Initial load duke parents: diff changeset	366	Node *nnn = old_new[old->_idx];
489c9b5090e2 Initial load duke parents: diff changeset	367	lazy_replace(nnn,nnn->in(TypeFunc::Control));
489c9b5090e2 Initial load duke parents: diff changeset	368	}
489c9b5090e2 Initial load duke parents: diff changeset	369	}
489c9b5090e2 Initial load duke parents: diff changeset	370
489c9b5090e2 Initial load duke parents: diff changeset	371	// Now force out all loop-invariant dominating tests. The optimizer
489c9b5090e2 Initial load duke parents: diff changeset	372	// finds some, but we _know_ they are all useless.
489c9b5090e2 Initial load duke parents: diff changeset	373	peeled_dom_test_elim(loop,old_new);
489c9b5090e2 Initial load duke parents: diff changeset	374
489c9b5090e2 Initial load duke parents: diff changeset	375	loop->record_for_igvn();
489c9b5090e2 Initial load duke parents: diff changeset	376	}
489c9b5090e2 Initial load duke parents: diff changeset	377
489c9b5090e2 Initial load duke parents: diff changeset	378	//------------------------------policy_maximally_unroll------------------------
489c9b5090e2 Initial load duke parents: diff changeset	379	// Return TRUE if the counted loop should be maximally (completely) unrolled.
// Returns FALSE when init, limit or stride is not a constant, when
// init >= limit, or when stride > (limit - init). Otherwise the trip count is
// computed as (limit - init) / stride and TRUE is returned only if the trip
// count, the body size and their product all stay within 4 * LoopUnrollLimit
// and the product is below MaxNodeLimit minus the current unique node count.
// Side effect: once the bounds checks pass, the computed trip count is stored
// on the loop head through set_trip_count(), even when FALSE is returned.
489c9b5090e2 Initial load duke parents: diff changeset	380	bool IdealLoopTree::policy_maximally_unroll( PhaseIdealLoop *phase ) const {
489c9b5090e2 Initial load duke parents: diff changeset	381	CountedLoopNode *cl = _head->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	382	assert( cl->is_normal_loop(), "" );
489c9b5090e2 Initial load duke parents: diff changeset	383
489c9b5090e2 Initial load duke parents: diff changeset	384	Node *init_n = cl->init_trip();
489c9b5090e2 Initial load duke parents: diff changeset	385	Node *limit_n = cl->limit();
489c9b5090e2 Initial load duke parents: diff changeset	386
489c9b5090e2 Initial load duke parents: diff changeset	387	// Non-constant bounds
489c9b5090e2 Initial load duke parents: diff changeset	388	if( init_n == NULL || !init_n->is_Con() ||
489c9b5090e2 Initial load duke parents: diff changeset	389	limit_n == NULL || !limit_n->is_Con() ||
489c9b5090e2 Initial load duke parents: diff changeset	390	// protect against stride not being a constant
489c9b5090e2 Initial load duke parents: diff changeset	391	!cl->stride_is_con() ) {
489c9b5090e2 Initial load duke parents: diff changeset	392	return false;
489c9b5090e2 Initial load duke parents: diff changeset	393	}
489c9b5090e2 Initial load duke parents: diff changeset	394	int init = init_n->get_int();
489c9b5090e2 Initial load duke parents: diff changeset	395	int limit = limit_n->get_int();
// NOTE(review): span is a plain int, so limit - init can overflow when the
// two constants are far apart; confirm whether a wider type is needed.
489c9b5090e2 Initial load duke parents: diff changeset	396	int span = limit - init;
489c9b5090e2 Initial load duke parents: diff changeset	397	int stride = cl->stride_con();
489c9b5090e2 Initial load duke parents: diff changeset	398
489c9b5090e2 Initial load duke parents: diff changeset	399	if (init >= limit || stride > span) {
489c9b5090e2 Initial load duke parents: diff changeset	400	// return a false (no maximally unroll) and the regular unroll/peel
489c9b5090e2 Initial load duke parents: diff changeset	401	// route will make a small mess which CCP will fold away.
489c9b5090e2 Initial load duke parents: diff changeset	402	return false;
489c9b5090e2 Initial load duke parents: diff changeset	403	}
// NOTE(review): a negative stride is not rejected by the check above. With a
// negative stride whose magnitude exceeds span the quotient below is zero and
// is later used as a divisor; confirm callers never get here with one.
489c9b5090e2 Initial load duke parents: diff changeset	404	uint trip_count = span/stride; // trip_count can be greater than 2 Gig.
489c9b5090e2 Initial load duke parents: diff changeset	405	assert( (int)trip_count*stride == span, "must divide evenly" );
489c9b5090e2 Initial load duke parents: diff changeset	406
489c9b5090e2 Initial load duke parents: diff changeset	407	// Real policy: if we maximally unroll, does it get too big?
489c9b5090e2 Initial load duke parents: diff changeset	408	// Allow the unrolled mess to get larger than standard loop
489c9b5090e2 Initial load duke parents: diff changeset	409	// size. After all, it will no longer be a loop.
489c9b5090e2 Initial load duke parents: diff changeset	410	uint body_size = _body.size();
489c9b5090e2 Initial load duke parents: diff changeset	411	uint unroll_limit = (uint)LoopUnrollLimit * 4;
489c9b5090e2 Initial load duke parents: diff changeset	412	assert( (intx)unroll_limit == LoopUnrollLimit * 4, "LoopUnrollLimit must fit in 32bits");
// The trip count is recorded before the size checks, so it is set even if
// the loop ends up not being maximally unrolled.
489c9b5090e2 Initial load duke parents: diff changeset	413	cl->set_trip_count(trip_count);
489c9b5090e2 Initial load duke parents: diff changeset	414	if( trip_count <= unroll_limit && body_size <= unroll_limit ) {
489c9b5090e2 Initial load duke parents: diff changeset	415	uint new_body_size = body_size * trip_count;
489c9b5090e2 Initial load duke parents: diff changeset	416	if (new_body_size <= unroll_limit &&
// Dividing back guards against the unsigned multiplication having wrapped.
489c9b5090e2 Initial load duke parents: diff changeset	417	body_size == new_body_size / trip_count &&
489c9b5090e2 Initial load duke parents: diff changeset	418	// Unrolling can result in a large amount of node construction
489c9b5090e2 Initial load duke parents: diff changeset	419	new_body_size < MaxNodeLimit - phase->C->unique()) {
489c9b5090e2 Initial load duke parents: diff changeset	420	return true; // maximally unroll
489c9b5090e2 Initial load duke parents: diff changeset	421	}
489c9b5090e2 Initial load duke parents: diff changeset	422	}
489c9b5090e2 Initial load duke parents: diff changeset	423
489c9b5090e2 Initial load duke parents: diff changeset	424	return false; // Do not maximally unroll
489c9b5090e2 Initial load duke parents: diff changeset	425	}
489c9b5090e2 Initial load duke parents: diff changeset	426
489c9b5090e2 Initial load duke parents: diff changeset	427
489c9b5090e2 Initial load duke parents: diff changeset	428	//------------------------------policy_unroll----------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	429	// Return TRUE or FALSE if the loop should be unrolled or not. Unroll if
489c9b5090e2 Initial load duke parents: diff changeset	430	// the loop is a CountedLoop and the body is small enough.
// The checks run in this order, each one able to veto the unroll:
//   1. stride must be a constant and the recorded trip count must exceed 1;
//   2. profile-based check against the expected trip count;
//   3. SuperWord progress check on body growth since the last unroll;
//   4. for non-constant bounds, the doubled stride must fit the iv type range;
//   5. weighted body size against LoopUnrollLimit (with an XorI exception);
//   6. absolute stride must not exceed 8.
489c9b5090e2 Initial load duke parents: diff changeset	431	bool IdealLoopTree::policy_unroll( PhaseIdealLoop *phase ) const {
489c9b5090e2 Initial load duke parents: diff changeset	432
489c9b5090e2 Initial load duke parents: diff changeset	433	CountedLoopNode *cl = _head->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	434	assert( cl->is_normal_loop() || cl->is_main_loop(), "" );
489c9b5090e2 Initial load duke parents: diff changeset	435
489c9b5090e2 Initial load duke parents: diff changeset	436	// protect against stride not being a constant
489c9b5090e2 Initial load duke parents: diff changeset	437	if( !cl->stride_is_con() ) return false;
489c9b5090e2 Initial load duke parents: diff changeset	438
489c9b5090e2 Initial load duke parents: diff changeset	439	// protect against over-unrolling
489c9b5090e2 Initial load duke parents: diff changeset	440	if( cl->trip_count() <= 1 ) return false;
489c9b5090e2 Initial load duke parents: diff changeset	441
// Unroll factor the loop would have after one more round of unrolling.
489c9b5090e2 Initial load duke parents: diff changeset	442	int future_unroll_ct = cl->unrolled_count() * 2;
489c9b5090e2 Initial load duke parents: diff changeset	443
489c9b5090e2 Initial load duke parents: diff changeset	444	// Don't unroll if the next round of unrolling would push us
489c9b5090e2 Initial load duke parents: diff changeset	445	// over the expected trip count of the loop. One is subtracted
489c9b5090e2 Initial load duke parents: diff changeset	446	// from the expected trip count because the pre-loop normally
489c9b5090e2 Initial load duke parents: diff changeset	447	// executes 1 iteration.
489c9b5090e2 Initial load duke parents: diff changeset	448	if (UnrollLimitForProfileCheck > 0 &&
489c9b5090e2 Initial load duke parents: diff changeset	449	cl->profile_trip_cnt() != COUNT_UNKNOWN &&
489c9b5090e2 Initial load duke parents: diff changeset	450	future_unroll_ct > UnrollLimitForProfileCheck &&
489c9b5090e2 Initial load duke parents: diff changeset	451	(float)future_unroll_ct > cl->profile_trip_cnt() - 1.0) {
489c9b5090e2 Initial load duke parents: diff changeset	452	return false;
489c9b5090e2 Initial load duke parents: diff changeset	453	}
489c9b5090e2 Initial load duke parents: diff changeset	454
489c9b5090e2 Initial load duke parents: diff changeset	455	// When unroll count is greater than LoopUnrollMin, don't unroll if:
489c9b5090e2 Initial load duke parents: diff changeset	456	// the residual iterations are more than 10% of the trip count
489c9b5090e2 Initial load duke parents: diff changeset	457	// and rounds of "unroll,optimize" are not making significant progress
489c9b5090e2 Initial load duke parents: diff changeset	458	// Progress defined as current size less than 20% larger than previous size.
489c9b5090e2 Initial load duke parents: diff changeset	459	if (UseSuperWord && cl->node_count_before_unroll() > 0 &&
489c9b5090e2 Initial load duke parents: diff changeset	460	future_unroll_ct > LoopUnrollMin &&
489c9b5090e2 Initial load duke parents: diff changeset	461	(future_unroll_ct - 1) * 10.0 > cl->profile_trip_cnt() &&
489c9b5090e2 Initial load duke parents: diff changeset	462	1.2 * cl->node_count_before_unroll() < (double)_body.size()) {
489c9b5090e2 Initial load duke parents: diff changeset	463	return false;
489c9b5090e2 Initial load duke parents: diff changeset	464	}
489c9b5090e2 Initial load duke parents: diff changeset	465
489c9b5090e2 Initial load duke parents: diff changeset	466	Node *init_n = cl->init_trip();
489c9b5090e2 Initial load duke parents: diff changeset	467	Node *limit_n = cl->limit();
489c9b5090e2 Initial load duke parents: diff changeset	468	// Non-constant bounds.
489c9b5090e2 Initial load duke parents: diff changeset	469	// Protect against over-unrolling when init or/and limit are not constant
489c9b5090e2 Initial load duke parents: diff changeset	470	// (so that trip_count's init value is maxint) but iv range is known.
489c9b5090e2 Initial load duke parents: diff changeset	471	if( init_n == NULL || !init_n->is_Con() ||
489c9b5090e2 Initial load duke parents: diff changeset	472	limit_n == NULL || !limit_n->is_Con() ) {
489c9b5090e2 Initial load duke parents: diff changeset	473	Node* phi = cl->phi();
489c9b5090e2 Initial load duke parents: diff changeset	474	if( phi != NULL ) {
489c9b5090e2 Initial load duke parents: diff changeset	475	assert(phi->is_Phi() && phi->in(0) == _head, "Counted loop should have iv phi.");
489c9b5090e2 Initial load duke parents: diff changeset	476	const TypeInt* iv_type = phase->_igvn.type(phi)->is_int();
489c9b5090e2 Initial load duke parents: diff changeset	477	int next_stride = cl->stride_con() * 2; // stride after this unroll
// Reject the unroll when a single step of the doubled stride, taken from the
// starting end of the iv type range, wraps around or leaves the range.
// NOTE(review): the wrap-around tests rely on signed addition wrapping.
489c9b5090e2 Initial load duke parents: diff changeset	478	if( next_stride > 0 ) {
489c9b5090e2 Initial load duke parents: diff changeset	479	if( iv_type->_lo + next_stride <= iv_type->_lo || // overflow
489c9b5090e2 Initial load duke parents: diff changeset	480	iv_type->_lo + next_stride > iv_type->_hi ) {
489c9b5090e2 Initial load duke parents: diff changeset	481	return false; // over-unrolling
489c9b5090e2 Initial load duke parents: diff changeset	482	}
489c9b5090e2 Initial load duke parents: diff changeset	483	} else if( next_stride < 0 ) {
489c9b5090e2 Initial load duke parents: diff changeset	484	if( iv_type->_hi + next_stride >= iv_type->_hi || // overflow
489c9b5090e2 Initial load duke parents: diff changeset	485	iv_type->_hi + next_stride < iv_type->_lo ) {
489c9b5090e2 Initial load duke parents: diff changeset	486	return false; // over-unrolling
489c9b5090e2 Initial load duke parents: diff changeset	487	}
489c9b5090e2 Initial load duke parents: diff changeset	488	}
489c9b5090e2 Initial load duke parents: diff changeset	489	}
489c9b5090e2 Initial load duke parents: diff changeset	490	}
489c9b5090e2 Initial load duke parents: diff changeset	491
489c9b5090e2 Initial load duke parents: diff changeset	492	// Adjust body_size to determine if we unroll or not
489c9b5090e2 Initial load duke parents: diff changeset	493	uint body_size = _body.size();
489c9b5090e2 Initial load duke parents: diff changeset	494	// Key test to unroll CaffeineMark's Logic test
489c9b5090e2 Initial load duke parents: diff changeset	495	int xors_in_loop = 0;
489c9b5090e2 Initial load duke parents: diff changeset	496	// Also count ModL, DivL and MulL which expand mightily
489c9b5090e2 Initial load duke parents: diff changeset	497	for( uint k = 0; k < _body.size(); k++ ) {
489c9b5090e2 Initial load duke parents: diff changeset	498	switch( _body.at(k)->Opcode() ) {
489c9b5090e2 Initial load duke parents: diff changeset	499	case Op_XorI: xors_in_loop++; break; // CaffeineMark's Logic test
489c9b5090e2 Initial load duke parents: diff changeset	500	case Op_ModL: body_size += 30; break;
489c9b5090e2 Initial load duke parents: diff changeset	501	case Op_DivL: body_size += 30; break;
489c9b5090e2 Initial load duke parents: diff changeset	502	case Op_MulL: body_size += 10; break;
489c9b5090e2 Initial load duke parents: diff changeset	503	}
489c9b5090e2 Initial load duke parents: diff changeset	504	}
489c9b5090e2 Initial load duke parents: diff changeset	505
489c9b5090e2 Initial load duke parents: diff changeset	506	// Check for being too big
489c9b5090e2 Initial load duke parents: diff changeset	507	if( body_size > (uint)LoopUnrollLimit ) {
// Exception: bodies with at least four XorI nodes may be up to four times
// the normal limit.
489c9b5090e2 Initial load duke parents: diff changeset	508	if( xors_in_loop >= 4 && body_size < (uint)LoopUnrollLimit*4) return true;
489c9b5090e2 Initial load duke parents: diff changeset	509	// Normal case: loop too big
489c9b5090e2 Initial load duke parents: diff changeset	510	return false;
489c9b5090e2 Initial load duke parents: diff changeset	511	}
489c9b5090e2 Initial load duke parents: diff changeset	512
489c9b5090e2 Initial load duke parents: diff changeset	513	// Check for stride being a small enough constant
489c9b5090e2 Initial load duke parents: diff changeset	514	if( abs(cl->stride_con()) > (1<<3) ) return false;
489c9b5090e2 Initial load duke parents: diff changeset	515
489c9b5090e2 Initial load duke parents: diff changeset	516	// Unroll once! (Each trip will soon do double iterations)
489c9b5090e2 Initial load duke parents: diff changeset	517	return true;
489c9b5090e2 Initial load duke parents: diff changeset	518	}
489c9b5090e2 Initial load duke parents: diff changeset	519
489c9b5090e2 Initial load duke parents: diff changeset	520	//------------------------------policy_align-----------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	521	// Return TRUE or FALSE if the loop should be cache-line aligned. Gather the
489c9b5090e2 Initial load duke parents: diff changeset	522	// expression that does the alignment. Note that only one array base can be
489c9b5090e2 Initial load duke parents: diff changeset	523	// aligned in a loop (unless the VM guarantees mutual alignment). Note that
489c9b5090e2 Initial load duke parents: diff changeset	524	// if we vectorize short memory ops into longer memory ops, we may want to
489c9b5090e2 Initial load duke parents: diff changeset	525	// increase alignment.
// As written, this policy unconditionally answers FALSE: the phase argument
// is not consulted and no alignment expression is gathered.
489c9b5090e2 Initial load duke parents: diff changeset	526	bool IdealLoopTree::policy_align( PhaseIdealLoop *phase ) const {
489c9b5090e2 Initial load duke parents: diff changeset	527	return false;
489c9b5090e2 Initial load duke parents: diff changeset	528	}
489c9b5090e2 Initial load duke parents: diff changeset	529
489c9b5090e2 Initial load duke parents: diff changeset	530	//------------------------------policy_range_check-----------------------------
489c9b5090e2 Initial load duke parents: diff changeset	531	// Return TRUE or FALSE if the loop should be range-check-eliminated.
489c9b5090e2 Initial load duke parents: diff changeset	532	// Actually we do iteration-splitting, a more powerful form of RCE.
// Answers FALSE immediately when RangeCheckElimination is off or when the
// loop head reports is_main_no_pre_loop(). Otherwise scans the loop body for
// an If node whose compare has one operand of the form accepted by
// is_scaled_iv_plus_offset() on the trip counter and the other operand
// controlled outside this loop, and answers TRUE for the first such If that
// is_loop_exit() accepts. Finding a compare operand whose control is top
// aborts the whole scan with FALSE.
489c9b5090e2 Initial load duke parents: diff changeset	533	bool IdealLoopTree::policy_range_check( PhaseIdealLoop *phase ) const {
489c9b5090e2 Initial load duke parents: diff changeset	534	if( !RangeCheckElimination ) return false;
489c9b5090e2 Initial load duke parents: diff changeset	535
489c9b5090e2 Initial load duke parents: diff changeset	536	CountedLoopNode *cl = _head->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	537	// If we unrolled with no intention of doing RCE and we later
489c9b5090e2 Initial load duke parents: diff changeset	538	// changed our minds, we got no pre-loop. Either we need to
489c9b5090e2 Initial load duke parents: diff changeset	539	// make a new pre-loop, or we gotta disallow RCE.
489c9b5090e2 Initial load duke parents: diff changeset	540	if( cl->is_main_no_pre_loop() ) return false; // Disallowed for now.
489c9b5090e2 Initial load duke parents: diff changeset	541	Node *trip_counter = cl->phi();
489c9b5090e2 Initial load duke parents: diff changeset	542
489c9b5090e2 Initial load duke parents: diff changeset	543	// Check loop body for tests of trip-counter plus loop-invariant vs
489c9b5090e2 Initial load duke parents: diff changeset	544	// loop-invariant.
489c9b5090e2 Initial load duke parents: diff changeset	545	for( uint i = 0; i < _body.size(); i++ ) {
489c9b5090e2 Initial load duke parents: diff changeset	546	Node *iff = _body[i];
489c9b5090e2 Initial load duke parents: diff changeset	547	if( iff->Opcode() == Op_If ) { // Test?
489c9b5090e2 Initial load duke parents: diff changeset	548
489c9b5090e2 Initial load duke parents: diff changeset	549	// Comparing trip+off vs limit
489c9b5090e2 Initial load duke parents: diff changeset	550	Node *bol = iff->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	551	if( bol->req() != 2 ) continue; // dead constant test
489c9b5090e2 Initial load duke parents: diff changeset	552	Node *cmp = bol->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	553
// First guess: input 1 is the range-check expression, input 2 the limit.
489c9b5090e2 Initial load duke parents: diff changeset	554	Node *rc_exp = cmp->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	555	Node *limit = cmp->in(2);
489c9b5090e2 Initial load duke parents: diff changeset	556
489c9b5090e2 Initial load duke parents: diff changeset	557	Node *limit_c = phase->get_ctrl(limit);
489c9b5090e2 Initial load duke parents: diff changeset	558	if( limit_c == phase->C->top() )
489c9b5090e2 Initial load duke parents: diff changeset	559	return false; // Found dead test on live IF? No RCE!
// The limit must be controlled outside this loop; if the guessed limit is
// controlled inside the loop, try the operands the other way round.
489c9b5090e2 Initial load duke parents: diff changeset	560	if( is_member(phase->get_loop(limit_c) ) ) {
489c9b5090e2 Initial load duke parents: diff changeset	561	// Compare might have operands swapped; commute them
489c9b5090e2 Initial load duke parents: diff changeset	562	rc_exp = cmp->in(2);
489c9b5090e2 Initial load duke parents: diff changeset	563	limit = cmp->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	564	limit_c = phase->get_ctrl(limit);
489c9b5090e2 Initial load duke parents: diff changeset	565	if( is_member(phase->get_loop(limit_c) ) )
489c9b5090e2 Initial load duke parents: diff changeset	566	continue; // Both inputs are loop varying; cannot RCE
489c9b5090e2 Initial load duke parents: diff changeset	567	}
489c9b5090e2 Initial load duke parents: diff changeset	568
// The scale and offset out-parameters are passed as NULL: only the yes/no
// answer is needed here.
489c9b5090e2 Initial load duke parents: diff changeset	569	if (!phase->is_scaled_iv_plus_offset(rc_exp, trip_counter, NULL, NULL)) {
489c9b5090e2 Initial load duke parents: diff changeset	570	continue;
489c9b5090e2 Initial load duke parents: diff changeset	571	}
489c9b5090e2 Initial load duke parents: diff changeset	572	// Yeah! Found a test like 'trip+off vs limit'
489c9b5090e2 Initial load duke parents: diff changeset	573	// Test is an IfNode, has 2 projections. If BOTH are in the loop
489c9b5090e2 Initial load duke parents: diff changeset	574	// we need loop unswitching instead of iteration splitting.
489c9b5090e2 Initial load duke parents: diff changeset	575	if( is_loop_exit(iff) )
489c9b5090e2 Initial load duke parents: diff changeset	576	return true; // Found reason to split iterations
489c9b5090e2 Initial load duke parents: diff changeset	577	} // End of is IF
489c9b5090e2 Initial load duke parents: diff changeset	578	}
489c9b5090e2 Initial load duke parents: diff changeset	579
// No qualifying exit test was found in the body.
489c9b5090e2 Initial load duke parents: diff changeset	580	return false;
489c9b5090e2 Initial load duke parents: diff changeset	581	}
489c9b5090e2 Initial load duke parents: diff changeset	582
489c9b5090e2 Initial load duke parents: diff changeset	583	//------------------------------policy_peel_only-------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	584	// Return TRUE or FALSE if the loop should NEVER be RCE'd or aligned. Useful
489c9b5090e2 Initial load duke parents: diff changeset	585	// for unrolling loops with NO array accesses.
// The test is purely structural: the answer is FALSE as soon as any node in
// the loop body reports is_Mem(), and TRUE otherwise. The phase argument is
// not consulted.
489c9b5090e2 Initial load duke parents: diff changeset	586	bool IdealLoopTree::policy_peel_only( PhaseIdealLoop *phase ) const {
489c9b5090e2 Initial load duke parents: diff changeset	587
489c9b5090e2 Initial load duke parents: diff changeset	588	for( uint i = 0; i < _body.size(); i++ )
489c9b5090e2 Initial load duke parents: diff changeset	589	if( _body[i]->is_Mem() )
489c9b5090e2 Initial load duke parents: diff changeset	590	return false;
489c9b5090e2 Initial load duke parents: diff changeset	591
489c9b5090e2 Initial load duke parents: diff changeset	592	// No memory accesses at all!
489c9b5090e2 Initial load duke parents: diff changeset	593	return true;
489c9b5090e2 Initial load duke parents: diff changeset	594	}
489c9b5090e2 Initial load duke parents: diff changeset	595
489c9b5090e2 Initial load duke parents: diff changeset	596	//------------------------------clone_up_backedge_goo--------------------------
489c9b5090e2 Initial load duke parents: diff changeset	597	// If Node n lives in the back_ctrl block and cannot float, we clone a private
489c9b5090e2 Initial load duke parents: diff changeset	598	// version of n in preheader_ctrl block and return that, otherwise return n.
// Outcomes, in order:
//   - n is not controlled by back_ctrl: n is returned untouched;
//   - n is pinned to back_ctrl, or any data input (index 1 and up) had to be
//     cloned by the recursive call: a clone of n with the rewired inputs is
//     registered at preheader_ctrl and returned;
//   - otherwise: the control of n is moved to
//     find_non_split_ctrl(back_ctrl->in(0)) and n itself is returned.
489c9b5090e2 Initial load duke parents: diff changeset	599	Node *PhaseIdealLoop::clone_up_backedge_goo( Node *back_ctrl, Node *preheader_ctrl, Node *n ) {
489c9b5090e2 Initial load duke parents: diff changeset	600	if( get_ctrl(n) != back_ctrl ) return n;
489c9b5090e2 Initial load duke parents: diff changeset	601
489c9b5090e2 Initial load duke parents: diff changeset	602	Node *x = NULL; // If required, a clone of 'n'
489c9b5090e2 Initial load duke parents: diff changeset	603	// Check for 'n' being pinned in the backedge.
489c9b5090e2 Initial load duke parents: diff changeset	604	if( n->in(0) && n->in(0) == back_ctrl ) {
489c9b5090e2 Initial load duke parents: diff changeset	605	x = n->clone(); // Clone a copy of 'n' to preheader
489c9b5090e2 Initial load duke parents: diff changeset	606	x->set_req( 0, preheader_ctrl ); // Fix x's control input to preheader
489c9b5090e2 Initial load duke parents: diff changeset	607	}
489c9b5090e2 Initial load duke parents: diff changeset	608
489c9b5090e2 Initial load duke parents: diff changeset	609	// Recursive fixup any other input edges into x.
489c9b5090e2 Initial load duke parents: diff changeset	610	// If there are no changes we can just return 'n', otherwise
489c9b5090e2 Initial load duke parents: diff changeset	611	// we need to clone a private copy and change it.
// The walk starts at input 1; the control input (index 0) was handled above.
489c9b5090e2 Initial load duke parents: diff changeset	612	for( uint i = 1; i < n->req(); i++ ) {
489c9b5090e2 Initial load duke parents: diff changeset	613	Node *g = clone_up_backedge_goo( back_ctrl, preheader_ctrl, n->in(i) );
489c9b5090e2 Initial load duke parents: diff changeset	614	if( g != n->in(i) ) {
// Clone lazily: only the first changed input forces a private copy.
489c9b5090e2 Initial load duke parents: diff changeset	615	if( !x )
489c9b5090e2 Initial load duke parents: diff changeset	616	x = n->clone();
489c9b5090e2 Initial load duke parents: diff changeset	617	x->set_req(i, g);
489c9b5090e2 Initial load duke parents: diff changeset	618	}
489c9b5090e2 Initial load duke parents: diff changeset	619	}
489c9b5090e2 Initial load duke parents: diff changeset	620	if( x ) { // x can legally float to pre-header location
489c9b5090e2 Initial load duke parents: diff changeset	621	register_new_node( x, preheader_ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	622	return x;
489c9b5090e2 Initial load duke parents: diff changeset	623	} else { // raise n to cover LCA of uses
489c9b5090e2 Initial load duke parents: diff changeset	624	set_ctrl( n, find_non_split_ctrl(back_ctrl->in(0)) );
489c9b5090e2 Initial load duke parents: diff changeset	625	}
489c9b5090e2 Initial load duke parents: diff changeset	626	return n;
489c9b5090e2 Initial load duke parents: diff changeset	627	}
489c9b5090e2 Initial load duke parents: diff changeset	628
489c9b5090e2 Initial load duke parents: diff changeset	629	//------------------------------insert_pre_post_loops--------------------------
489c9b5090e2 Initial load duke parents: diff changeset	630	// Insert pre and post loops. If peel_only is set, the pre-loop can not have
489c9b5090e2 Initial load duke parents: diff changeset	631	// more iterations added. It acts as a 'peel' only, no lower-bound RCE, no
489c9b5090e2 Initial load duke parents: diff changeset	632	// alignment. Useful to unroll loops that do no array accesses.
489c9b5090e2 Initial load duke parents: diff changeset	633	void PhaseIdealLoop::insert_pre_post_loops( IdealLoopTree *loop, Node_List &old_new, bool peel_only ) {
489c9b5090e2 Initial load duke parents: diff changeset	634
489c9b5090e2 Initial load duke parents: diff changeset	635	C->set_major_progress();
489c9b5090e2 Initial load duke parents: diff changeset	636
489c9b5090e2 Initial load duke parents: diff changeset	637	// Find common pieces of the loop being guarded with pre & post loops
489c9b5090e2 Initial load duke parents: diff changeset	638	CountedLoopNode *main_head = loop->_head->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	639	assert( main_head->is_normal_loop(), "" );
489c9b5090e2 Initial load duke parents: diff changeset	640	CountedLoopEndNode *main_end = main_head->loopexit();
489c9b5090e2 Initial load duke parents: diff changeset	641	assert( main_end->outcnt() == 2, "1 true, 1 false path only" );
489c9b5090e2 Initial load duke parents: diff changeset	642	uint dd_main_head = dom_depth(main_head);
489c9b5090e2 Initial load duke parents: diff changeset	643	uint max = main_head->outcnt();
489c9b5090e2 Initial load duke parents: diff changeset	644
489c9b5090e2 Initial load duke parents: diff changeset	645	Node *pre_header= main_head->in(LoopNode::EntryControl);
489c9b5090e2 Initial load duke parents: diff changeset	646	Node *init = main_head->init_trip();
489c9b5090e2 Initial load duke parents: diff changeset	647	Node *incr = main_end ->incr();
489c9b5090e2 Initial load duke parents: diff changeset	648	Node *limit = main_end ->limit();
489c9b5090e2 Initial load duke parents: diff changeset	649	Node *stride = main_end ->stride();
489c9b5090e2 Initial load duke parents: diff changeset	650	Node *cmp = main_end ->cmp_node();
489c9b5090e2 Initial load duke parents: diff changeset	651	BoolTest::mask b_test = main_end->test_trip();
489c9b5090e2 Initial load duke parents: diff changeset	652
489c9b5090e2 Initial load duke parents: diff changeset	653	// Need only 1 user of 'bol' because I will be hacking the loop bounds.
489c9b5090e2 Initial load duke parents: diff changeset	654	Node *bol = main_end->in(CountedLoopEndNode::TestValue);
489c9b5090e2 Initial load duke parents: diff changeset	655	if( bol->outcnt() != 1 ) {
489c9b5090e2 Initial load duke parents: diff changeset	656	bol = bol->clone();
489c9b5090e2 Initial load duke parents: diff changeset	657	register_new_node(bol,main_end->in(CountedLoopEndNode::TestControl));
489c9b5090e2 Initial load duke parents: diff changeset	658	_igvn.hash_delete(main_end);
489c9b5090e2 Initial load duke parents: diff changeset	659	main_end->set_req(CountedLoopEndNode::TestValue, bol);
489c9b5090e2 Initial load duke parents: diff changeset	660	}
489c9b5090e2 Initial load duke parents: diff changeset	661	// Need only 1 user of 'cmp' because I will be hacking the loop bounds.
489c9b5090e2 Initial load duke parents: diff changeset	662	if( cmp->outcnt() != 1 ) {
489c9b5090e2 Initial load duke parents: diff changeset	663	cmp = cmp->clone();
489c9b5090e2 Initial load duke parents: diff changeset	664	register_new_node(cmp,main_end->in(CountedLoopEndNode::TestControl));
489c9b5090e2 Initial load duke parents: diff changeset	665	_igvn.hash_delete(bol);
489c9b5090e2 Initial load duke parents: diff changeset	666	bol->set_req(1, cmp);
489c9b5090e2 Initial load duke parents: diff changeset	667	}
489c9b5090e2 Initial load duke parents: diff changeset	668
489c9b5090e2 Initial load duke parents: diff changeset	669	//------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	670	// Step A: Create Post-Loop.
489c9b5090e2 Initial load duke parents: diff changeset	671	Node* main_exit = main_end->proj_out(false);
489c9b5090e2 Initial load duke parents: diff changeset	672	assert( main_exit->Opcode() == Op_IfFalse, "" );
489c9b5090e2 Initial load duke parents: diff changeset	673	int dd_main_exit = dom_depth(main_exit);
489c9b5090e2 Initial load duke parents: diff changeset	674
489c9b5090e2 Initial load duke parents: diff changeset	675	// Step A1: Clone the loop body. The clone becomes the post-loop. The main
489c9b5090e2 Initial load duke parents: diff changeset	676	// loop pre-header illegally has 2 control users (old & new loops).
489c9b5090e2 Initial load duke parents: diff changeset	677	clone_loop( loop, old_new, dd_main_exit );
489c9b5090e2 Initial load duke parents: diff changeset	678	assert( old_new[main_end ->_idx]->Opcode() == Op_CountedLoopEnd, "" );
489c9b5090e2 Initial load duke parents: diff changeset	679	CountedLoopNode *post_head = old_new[main_head->_idx]->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	680	post_head->set_post_loop(main_head);
489c9b5090e2 Initial load duke parents: diff changeset	681
489c9b5090e2 Initial load duke parents: diff changeset	682	// Build the main-loop normal exit.
489c9b5090e2 Initial load duke parents: diff changeset	683	IfFalseNode *new_main_exit = new (C, 1) IfFalseNode(main_end);
489c9b5090e2 Initial load duke parents: diff changeset	684	_igvn.register_new_node_with_optimizer( new_main_exit );
489c9b5090e2 Initial load duke parents: diff changeset	685	set_idom(new_main_exit, main_end, dd_main_exit );
489c9b5090e2 Initial load duke parents: diff changeset	686	set_loop(new_main_exit, loop->_parent);
489c9b5090e2 Initial load duke parents: diff changeset	687
489c9b5090e2 Initial load duke parents: diff changeset	688	// Step A2: Build a zero-trip guard for the post-loop. After leaving the
489c9b5090e2 Initial load duke parents: diff changeset	689	// main-loop, the post-loop may not execute at all. We 'opaque' the incr
489c9b5090e2 Initial load duke parents: diff changeset	690	// (the main-loop trip-counter exit value) because we will be changing
489c9b5090e2 Initial load duke parents: diff changeset	691	// the exit value (via unrolling) so we cannot constant-fold away the zero
489c9b5090e2 Initial load duke parents: diff changeset	692	// trip guard until all unrolling is done.
489c9b5090e2 Initial load duke parents: diff changeset	693	Node *zer_opaq = new (C, 2) Opaque1Node(incr);
489c9b5090e2 Initial load duke parents: diff changeset	694	Node *zer_cmp = new (C, 3) CmpINode( zer_opaq, limit );
489c9b5090e2 Initial load duke parents: diff changeset	695	Node *zer_bol = new (C, 2) BoolNode( zer_cmp, b_test );
489c9b5090e2 Initial load duke parents: diff changeset	696	register_new_node( zer_opaq, new_main_exit );
489c9b5090e2 Initial load duke parents: diff changeset	697	register_new_node( zer_cmp , new_main_exit );
489c9b5090e2 Initial load duke parents: diff changeset	698	register_new_node( zer_bol , new_main_exit );
489c9b5090e2 Initial load duke parents: diff changeset	699
489c9b5090e2 Initial load duke parents: diff changeset	700	// Build the IfNode
489c9b5090e2 Initial load duke parents: diff changeset	701	IfNode *zer_iff = new (C, 2) IfNode( new_main_exit, zer_bol, PROB_FAIR, COUNT_UNKNOWN );
489c9b5090e2 Initial load duke parents: diff changeset	702	_igvn.register_new_node_with_optimizer( zer_iff );
489c9b5090e2 Initial load duke parents: diff changeset	703	set_idom(zer_iff, new_main_exit, dd_main_exit);
489c9b5090e2 Initial load duke parents: diff changeset	704	set_loop(zer_iff, loop->_parent);
489c9b5090e2 Initial load duke parents: diff changeset	705
489c9b5090e2 Initial load duke parents: diff changeset	706	// Plug in the false-path, taken if we need to skip post-loop
489c9b5090e2 Initial load duke parents: diff changeset	707	_igvn.hash_delete( main_exit );
489c9b5090e2 Initial load duke parents: diff changeset	708	main_exit->set_req(0, zer_iff);
489c9b5090e2 Initial load duke parents: diff changeset	709	_igvn._worklist.push(main_exit);
489c9b5090e2 Initial load duke parents: diff changeset	710	set_idom(main_exit, zer_iff, dd_main_exit);
489c9b5090e2 Initial load duke parents: diff changeset	711	set_idom(main_exit->unique_out(), zer_iff, dd_main_exit);
489c9b5090e2 Initial load duke parents: diff changeset	712	// Make the true-path, must enter the post loop
489c9b5090e2 Initial load duke parents: diff changeset	713	Node *zer_taken = new (C, 1) IfTrueNode( zer_iff );
489c9b5090e2 Initial load duke parents: diff changeset	714	_igvn.register_new_node_with_optimizer( zer_taken );
489c9b5090e2 Initial load duke parents: diff changeset	715	set_idom(zer_taken, zer_iff, dd_main_exit);
489c9b5090e2 Initial load duke parents: diff changeset	716	set_loop(zer_taken, loop->_parent);
489c9b5090e2 Initial load duke parents: diff changeset	717	// Plug in the true path
489c9b5090e2 Initial load duke parents: diff changeset	718	_igvn.hash_delete( post_head );
489c9b5090e2 Initial load duke parents: diff changeset	719	post_head->set_req(LoopNode::EntryControl, zer_taken);
489c9b5090e2 Initial load duke parents: diff changeset	720	set_idom(post_head, zer_taken, dd_main_exit);
489c9b5090e2 Initial load duke parents: diff changeset	721
489c9b5090e2 Initial load duke parents: diff changeset	722	// Step A3: Make the fall-in values to the post-loop come from the
489c9b5090e2 Initial load duke parents: diff changeset	723	// fall-out values of the main-loop.
489c9b5090e2 Initial load duke parents: diff changeset	724	for (DUIterator_Fast imax, i = main_head->fast_outs(imax); i < imax; i++) {
489c9b5090e2 Initial load duke parents: diff changeset	725	Node* main_phi = main_head->fast_out(i);
489c9b5090e2 Initial load duke parents: diff changeset	726	if( main_phi->is_Phi() && main_phi->in(0) == main_head && main_phi->outcnt() >0 ) {
489c9b5090e2 Initial load duke parents: diff changeset	727	Node *post_phi = old_new[main_phi->_idx];
489c9b5090e2 Initial load duke parents: diff changeset	728	Node *fallmain = clone_up_backedge_goo(main_head->back_control(),
489c9b5090e2 Initial load duke parents: diff changeset	729	post_head->init_control(),
489c9b5090e2 Initial load duke parents: diff changeset	730	main_phi->in(LoopNode::LoopBackControl));
489c9b5090e2 Initial load duke parents: diff changeset	731	_igvn.hash_delete(post_phi);
489c9b5090e2 Initial load duke parents: diff changeset	732	post_phi->set_req( LoopNode::EntryControl, fallmain );
489c9b5090e2 Initial load duke parents: diff changeset	733	}
489c9b5090e2 Initial load duke parents: diff changeset	734	}
489c9b5090e2 Initial load duke parents: diff changeset	735
489c9b5090e2 Initial load duke parents: diff changeset	736	// Update local caches for next stanza
489c9b5090e2 Initial load duke parents: diff changeset	737	main_exit = new_main_exit;
489c9b5090e2 Initial load duke parents: diff changeset	738
489c9b5090e2 Initial load duke parents: diff changeset	739
489c9b5090e2 Initial load duke parents: diff changeset	740	//------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	741	// Step B: Create Pre-Loop.
489c9b5090e2 Initial load duke parents: diff changeset	742
489c9b5090e2 Initial load duke parents: diff changeset	743	// Step B1: Clone the loop body. The clone becomes the pre-loop. The main
489c9b5090e2 Initial load duke parents: diff changeset	744	// loop pre-header illegally has 2 control users (old & new loops).
489c9b5090e2 Initial load duke parents: diff changeset	745	clone_loop( loop, old_new, dd_main_head );
489c9b5090e2 Initial load duke parents: diff changeset	746	CountedLoopNode* pre_head = old_new[main_head->_idx]->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	747	CountedLoopEndNode* pre_end = old_new[main_end ->_idx]->as_CountedLoopEnd();
489c9b5090e2 Initial load duke parents: diff changeset	748	pre_head->set_pre_loop(main_head);
489c9b5090e2 Initial load duke parents: diff changeset	749	Node *pre_incr = old_new[incr->_idx];
489c9b5090e2 Initial load duke parents: diff changeset	750
489c9b5090e2 Initial load duke parents: diff changeset	751	// Find the pre-loop normal exit.
489c9b5090e2 Initial load duke parents: diff changeset	752	Node* pre_exit = pre_end->proj_out(false);
489c9b5090e2 Initial load duke parents: diff changeset	753	assert( pre_exit->Opcode() == Op_IfFalse, "" );
489c9b5090e2 Initial load duke parents: diff changeset	754	IfFalseNode *new_pre_exit = new (C, 1) IfFalseNode(pre_end);
489c9b5090e2 Initial load duke parents: diff changeset	755	_igvn.register_new_node_with_optimizer( new_pre_exit );
489c9b5090e2 Initial load duke parents: diff changeset	756	set_idom(new_pre_exit, pre_end, dd_main_head);
489c9b5090e2 Initial load duke parents: diff changeset	757	set_loop(new_pre_exit, loop->_parent);
489c9b5090e2 Initial load duke parents: diff changeset	758
489c9b5090e2 Initial load duke parents: diff changeset	759	// Step B2: Build a zero-trip guard for the main-loop. After leaving the
489c9b5090e2 Initial load duke parents: diff changeset	760	// pre-loop, the main-loop may not execute at all. Later in life this
489c9b5090e2 Initial load duke parents: diff changeset	761	// zero-trip guard will become the minimum-trip guard when we unroll
489c9b5090e2 Initial load duke parents: diff changeset	762	// the main-loop.
489c9b5090e2 Initial load duke parents: diff changeset	763	Node *min_opaq = new (C, 2) Opaque1Node(limit);
489c9b5090e2 Initial load duke parents: diff changeset	764	Node *min_cmp = new (C, 3) CmpINode( pre_incr, min_opaq );
489c9b5090e2 Initial load duke parents: diff changeset	765	Node *min_bol = new (C, 2) BoolNode( min_cmp, b_test );
489c9b5090e2 Initial load duke parents: diff changeset	766	register_new_node( min_opaq, new_pre_exit );
489c9b5090e2 Initial load duke parents: diff changeset	767	register_new_node( min_cmp , new_pre_exit );
489c9b5090e2 Initial load duke parents: diff changeset	768	register_new_node( min_bol , new_pre_exit );
489c9b5090e2 Initial load duke parents: diff changeset	769
489c9b5090e2 Initial load duke parents: diff changeset	770	// Build the IfNode
489c9b5090e2 Initial load duke parents: diff changeset	771	IfNode *min_iff = new (C, 2) IfNode( new_pre_exit, min_bol, PROB_FAIR, COUNT_UNKNOWN );
489c9b5090e2 Initial load duke parents: diff changeset	772	_igvn.register_new_node_with_optimizer( min_iff );
489c9b5090e2 Initial load duke parents: diff changeset	773	set_idom(min_iff, new_pre_exit, dd_main_head);
489c9b5090e2 Initial load duke parents: diff changeset	774	set_loop(min_iff, loop->_parent);
489c9b5090e2 Initial load duke parents: diff changeset	775
489c9b5090e2 Initial load duke parents: diff changeset	776	// Plug in the false-path, taken if we need to skip main-loop
489c9b5090e2 Initial load duke parents: diff changeset	777	_igvn.hash_delete( pre_exit );
489c9b5090e2 Initial load duke parents: diff changeset	778	pre_exit->set_req(0, min_iff);
489c9b5090e2 Initial load duke parents: diff changeset	779	set_idom(pre_exit, min_iff, dd_main_head);
489c9b5090e2 Initial load duke parents: diff changeset	780	set_idom(pre_exit->unique_out(), min_iff, dd_main_head);
489c9b5090e2 Initial load duke parents: diff changeset	781	// Make the true-path, must enter the main loop
489c9b5090e2 Initial load duke parents: diff changeset	782	Node *min_taken = new (C, 1) IfTrueNode( min_iff );
489c9b5090e2 Initial load duke parents: diff changeset	783	_igvn.register_new_node_with_optimizer( min_taken );
489c9b5090e2 Initial load duke parents: diff changeset	784	set_idom(min_taken, min_iff, dd_main_head);
489c9b5090e2 Initial load duke parents: diff changeset	785	set_loop(min_taken, loop->_parent);
489c9b5090e2 Initial load duke parents: diff changeset	786	// Plug in the true path
489c9b5090e2 Initial load duke parents: diff changeset	787	_igvn.hash_delete( main_head );
489c9b5090e2 Initial load duke parents: diff changeset	788	main_head->set_req(LoopNode::EntryControl, min_taken);
489c9b5090e2 Initial load duke parents: diff changeset	789	set_idom(main_head, min_taken, dd_main_head);
489c9b5090e2 Initial load duke parents: diff changeset	790
489c9b5090e2 Initial load duke parents: diff changeset	791	// Step B3: Make the fall-in values to the main-loop come from the
489c9b5090e2 Initial load duke parents: diff changeset	792	// fall-out values of the pre-loop.
489c9b5090e2 Initial load duke parents: diff changeset	793	for (DUIterator_Fast i2max, i2 = main_head->fast_outs(i2max); i2 < i2max; i2++) {
489c9b5090e2 Initial load duke parents: diff changeset	794	Node* main_phi = main_head->fast_out(i2);
489c9b5090e2 Initial load duke parents: diff changeset	795	if( main_phi->is_Phi() && main_phi->in(0) == main_head && main_phi->outcnt() > 0 ) {
489c9b5090e2 Initial load duke parents: diff changeset	796	Node *pre_phi = old_new[main_phi->_idx];
489c9b5090e2 Initial load duke parents: diff changeset	797	Node *fallpre = clone_up_backedge_goo(pre_head->back_control(),
489c9b5090e2 Initial load duke parents: diff changeset	798	main_head->init_control(),
489c9b5090e2 Initial load duke parents: diff changeset	799	pre_phi->in(LoopNode::LoopBackControl));
489c9b5090e2 Initial load duke parents: diff changeset	800	_igvn.hash_delete(main_phi);
489c9b5090e2 Initial load duke parents: diff changeset	801	main_phi->set_req( LoopNode::EntryControl, fallpre );
489c9b5090e2 Initial load duke parents: diff changeset	802	}
489c9b5090e2 Initial load duke parents: diff changeset	803	}
489c9b5090e2 Initial load duke parents: diff changeset	804
489c9b5090e2 Initial load duke parents: diff changeset	805	// Step B4: Shorten the pre-loop to run only 1 iteration (for now).
489c9b5090e2 Initial load duke parents: diff changeset	806	// RCE and alignment may change this later.
489c9b5090e2 Initial load duke parents: diff changeset	807	Node *cmp_end = pre_end->cmp_node();
489c9b5090e2 Initial load duke parents: diff changeset	808	assert( cmp_end->in(2) == limit, "" );
489c9b5090e2 Initial load duke parents: diff changeset	809	Node *pre_limit = new (C, 3) AddINode( init, stride );
489c9b5090e2 Initial load duke parents: diff changeset	810
489c9b5090e2 Initial load duke parents: diff changeset	811	// Save the original loop limit in this Opaque1 node for
489c9b5090e2 Initial load duke parents: diff changeset	812	// use by range check elimination.
489c9b5090e2 Initial load duke parents: diff changeset	813	Node *pre_opaq = new (C, 3) Opaque1Node(pre_limit, limit);
489c9b5090e2 Initial load duke parents: diff changeset	814
489c9b5090e2 Initial load duke parents: diff changeset	815	register_new_node( pre_limit, pre_head->in(0) );
489c9b5090e2 Initial load duke parents: diff changeset	816	register_new_node( pre_opaq , pre_head->in(0) );
489c9b5090e2 Initial load duke parents: diff changeset	817
489c9b5090e2 Initial load duke parents: diff changeset	818	// Since no other users of pre-loop compare, I can hack limit directly
489c9b5090e2 Initial load duke parents: diff changeset	819	assert( cmp_end->outcnt() == 1, "no other users" );
489c9b5090e2 Initial load duke parents: diff changeset	820	_igvn.hash_delete(cmp_end);
489c9b5090e2 Initial load duke parents: diff changeset	821	cmp_end->set_req(2, peel_only ? pre_limit : pre_opaq);
489c9b5090e2 Initial load duke parents: diff changeset	822
489c9b5090e2 Initial load duke parents: diff changeset	823	// Special case for not-equal loop bounds:
489c9b5090e2 Initial load duke parents: diff changeset	824	// Change pre loop test, main loop test, and the
489c9b5090e2 Initial load duke parents: diff changeset	825	// main loop guard test to use lt or gt depending on stride
489c9b5090e2 Initial load duke parents: diff changeset	826	// direction:
489c9b5090e2 Initial load duke parents: diff changeset	827	// positive stride use <
489c9b5090e2 Initial load duke parents: diff changeset	828	// negative stride use >
489c9b5090e2 Initial load duke parents: diff changeset	829
489c9b5090e2 Initial load duke parents: diff changeset	830	if (pre_end->in(CountedLoopEndNode::TestValue)->as_Bool()->_test._test == BoolTest::ne) {
489c9b5090e2 Initial load duke parents: diff changeset	831
489c9b5090e2 Initial load duke parents: diff changeset	832	BoolTest::mask new_test = (main_end->stride_con() > 0) ? BoolTest::lt : BoolTest::gt;
489c9b5090e2 Initial load duke parents: diff changeset	833	// Modify pre loop end condition
489c9b5090e2 Initial load duke parents: diff changeset	834	Node* pre_bol = pre_end->in(CountedLoopEndNode::TestValue)->as_Bool();
489c9b5090e2 Initial load duke parents: diff changeset	835	BoolNode* new_bol0 = new (C, 2) BoolNode(pre_bol->in(1), new_test);
489c9b5090e2 Initial load duke parents: diff changeset	836	register_new_node( new_bol0, pre_head->in(0) );
489c9b5090e2 Initial load duke parents: diff changeset	837	_igvn.hash_delete(pre_end);
489c9b5090e2 Initial load duke parents: diff changeset	838	pre_end->set_req(CountedLoopEndNode::TestValue, new_bol0);
489c9b5090e2 Initial load duke parents: diff changeset	839	// Modify main loop guard condition
489c9b5090e2 Initial load duke parents: diff changeset	840	assert(min_iff->in(CountedLoopEndNode::TestValue) == min_bol, "guard okay");
489c9b5090e2 Initial load duke parents: diff changeset	841	BoolNode* new_bol1 = new (C, 2) BoolNode(min_bol->in(1), new_test);
489c9b5090e2 Initial load duke parents: diff changeset	842	register_new_node( new_bol1, new_pre_exit );
489c9b5090e2 Initial load duke parents: diff changeset	843	_igvn.hash_delete(min_iff);
489c9b5090e2 Initial load duke parents: diff changeset	844	min_iff->set_req(CountedLoopEndNode::TestValue, new_bol1);
489c9b5090e2 Initial load duke parents: diff changeset	845	// Modify main loop end condition
489c9b5090e2 Initial load duke parents: diff changeset	846	BoolNode* main_bol = main_end->in(CountedLoopEndNode::TestValue)->as_Bool();
489c9b5090e2 Initial load duke parents: diff changeset	847	BoolNode* new_bol2 = new (C, 2) BoolNode(main_bol->in(1), new_test);
489c9b5090e2 Initial load duke parents: diff changeset	848	register_new_node( new_bol2, main_end->in(CountedLoopEndNode::TestControl) );
489c9b5090e2 Initial load duke parents: diff changeset	849	_igvn.hash_delete(main_end);
489c9b5090e2 Initial load duke parents: diff changeset	850	main_end->set_req(CountedLoopEndNode::TestValue, new_bol2);
489c9b5090e2 Initial load duke parents: diff changeset	851	}
489c9b5090e2 Initial load duke parents: diff changeset	852
489c9b5090e2 Initial load duke parents: diff changeset	853	// Flag main loop
489c9b5090e2 Initial load duke parents: diff changeset	854	main_head->set_main_loop();
489c9b5090e2 Initial load duke parents: diff changeset	855	if( peel_only ) main_head->set_main_no_pre_loop();
489c9b5090e2 Initial load duke parents: diff changeset	856
489c9b5090e2 Initial load duke parents: diff changeset	857	// It's difficult to be precise about the trip-counts
489c9b5090e2 Initial load duke parents: diff changeset	858	// for the pre/post loops. They are usually very short,
489c9b5090e2 Initial load duke parents: diff changeset	859	// so guess that 4 trips is a reasonable value.
489c9b5090e2 Initial load duke parents: diff changeset	860	post_head->set_profile_trip_cnt(4.0);
489c9b5090e2 Initial load duke parents: diff changeset	861	pre_head->set_profile_trip_cnt(4.0);
489c9b5090e2 Initial load duke parents: diff changeset	862
489c9b5090e2 Initial load duke parents: diff changeset	863	// Now force out all loop-invariant dominating tests. The optimizer
489c9b5090e2 Initial load duke parents: diff changeset	864	// finds some, but we _know_ they are all useless.
489c9b5090e2 Initial load duke parents: diff changeset	865	peeled_dom_test_elim(loop,old_new);
489c9b5090e2 Initial load duke parents: diff changeset	866	}
489c9b5090e2 Initial load duke parents: diff changeset	867
489c9b5090e2 Initial load duke parents: diff changeset	868	//------------------------------is_invariant-----------------------------
489c9b5090e2 Initial load duke parents: diff changeset	869	// Return true if n is invariant
489c9b5090e2 Initial load duke parents: diff changeset	870	bool IdealLoopTree::is_invariant(Node* n) const {
489c9b5090e2 Initial load duke parents: diff changeset	871	Node *n_c = _phase->get_ctrl(n);
489c9b5090e2 Initial load duke parents: diff changeset	872	if (n_c->is_top()) return false;
489c9b5090e2 Initial load duke parents: diff changeset	873	return !is_member(_phase->get_loop(n_c));
489c9b5090e2 Initial load duke parents: diff changeset	874	}
489c9b5090e2 Initial load duke parents: diff changeset	875
489c9b5090e2 Initial load duke parents: diff changeset	876
489c9b5090e2 Initial load duke parents: diff changeset	877	//------------------------------do_unroll--------------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	878	// Unroll the loop body one step - make each trip do 2 iterations.
//
// loop            - loop tree entry; its _head must be a CountedLoop. On
//                   return loop->_head has been switched to the cloned head.
// old_new         - node map indexed by Node::_idx; read after clone_loop()
//                   to find the clone of each original node (presumably
//                   filled in by clone_loop - confirm there).
// adjust_min_trip - if true the loop is asserted to be a 'main' loop and the
//                   guard test in front of it is re-pointed at the new limit.
//                   If that guard's Opaque1 node cannot be found the function
//                   returns early without creating or rewiring any nodes
//                   (the node count recorded on the loop head is still
//                   updated before the bail-out).
489c9b5090e2 Initial load duke parents: diff changeset	879	void PhaseIdealLoop::do_unroll( IdealLoopTree *loop, Node_List &old_new, bool adjust_min_trip ) {
489c9b5090e2 Initial load duke parents: diff changeset	880	assert( LoopUnrollLimit, "" );
489c9b5090e2 Initial load duke parents: diff changeset	881	#ifndef PRODUCT
489c9b5090e2 Initial load duke parents: diff changeset	882	if( PrintOpto && VerifyLoopOptimizations ) {
489c9b5090e2 Initial load duke parents: diff changeset	883	tty->print("Unrolling ");
489c9b5090e2 Initial load duke parents: diff changeset	884	loop->dump_head();
489c9b5090e2 Initial load duke parents: diff changeset	885	}
489c9b5090e2 Initial load duke parents: diff changeset	886	#endif
489c9b5090e2 Initial load duke parents: diff changeset	887	CountedLoopNode *loop_head = loop->_head->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	888	CountedLoopEndNode *loop_end = loop_head->loopexit();
489c9b5090e2 Initial load duke parents: diff changeset	889	assert( loop_end, "" );
489c9b5090e2 Initial load duke parents: diff changeset	890
489c9b5090e2 Initial load duke parents: diff changeset	891	// Remember loop node count before unrolling to detect
489c9b5090e2 Initial load duke parents: diff changeset	892	// if rounds of unroll,optimize are making progress
489c9b5090e2 Initial load duke parents: diff changeset	893	loop_head->set_node_count_before_unroll(loop->_body.size());
489c9b5090e2 Initial load duke parents: diff changeset	894
// Cache the loop's entry control and its trip-counter parameters; the new
// limit computation below is built from these and placed at 'ctrl'.
489c9b5090e2 Initial load duke parents: diff changeset	895	Node *ctrl = loop_head->in(LoopNode::EntryControl);
489c9b5090e2 Initial load duke parents: diff changeset	896	Node *limit = loop_head->limit();
489c9b5090e2 Initial load duke parents: diff changeset	897	Node *init = loop_head->init_trip();
489c9b5090e2 Initial load duke parents: diff changeset	898	Node *strid = loop_head->stride();
489c9b5090e2 Initial load duke parents: diff changeset	899
// Step 1 (unlabelled in the original): locate the guard in front of the loop.
// Walk up from the entry control: projection -> If -> Bool -> CmpI.  The
// CmpI's second input is expected to be the Opaque1 node wrapping the limit.
489c9b5090e2 Initial load duke parents: diff changeset	900	Node *opaq = NULL;
489c9b5090e2 Initial load duke parents: diff changeset	901	if( adjust_min_trip ) { // If not maximally unrolling, need adjustment
489c9b5090e2 Initial load duke parents: diff changeset	902	assert( loop_head->is_main_loop(), "" );
489c9b5090e2 Initial load duke parents: diff changeset	903	assert( ctrl->Opcode() == Op_IfTrue \|\| ctrl->Opcode() == Op_IfFalse, "" );
489c9b5090e2 Initial load duke parents: diff changeset	904	Node *iff = ctrl->in(0);
489c9b5090e2 Initial load duke parents: diff changeset	905	assert( iff->Opcode() == Op_If, "" );
489c9b5090e2 Initial load duke parents: diff changeset	906	Node *bol = iff->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	907	assert( bol->Opcode() == Op_Bool, "" );
489c9b5090e2 Initial load duke parents: diff changeset	908	Node *cmp = bol->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	909	assert( cmp->Opcode() == Op_CmpI, "" );
489c9b5090e2 Initial load duke parents: diff changeset	910	opaq = cmp->in(2);
489c9b5090e2 Initial load duke parents: diff changeset	911	// Occasionally it's possible for a pre-loop Opaque1 node to be
489c9b5090e2 Initial load duke parents: diff changeset	912	// optimized away and then another round of loop opts attempted.
489c9b5090e2 Initial load duke parents: diff changeset	913	// We can not optimize this particular loop in that case.
// This is a runtime check (not an assert), so it also applies in builds where
// the asserts above are compiled out.
489c9b5090e2 Initial load duke parents: diff changeset	914	if( opaq->Opcode() != Op_Opaque1 )
489c9b5090e2 Initial load duke parents: diff changeset	915	return; // Cannot find pre-loop! Bail out!
489c9b5090e2 Initial load duke parents: diff changeset	916	}
489c9b5090e2 Initial load duke parents: diff changeset	917
// Past this point the transformation is committed: flag major progress only
// after the bail-out above so a skipped loop does not report progress.
489c9b5090e2 Initial load duke parents: diff changeset	918	C->set_major_progress();
489c9b5090e2 Initial load duke parents: diff changeset	919
489c9b5090e2 Initial load duke parents: diff changeset	920	// Adjust max trip count. The trip count is intentionally rounded
489c9b5090e2 Initial load duke parents: diff changeset	921	// down here (e.g. 15-> 7-> 3-> 1) because if we unwittingly over-unroll,
489c9b5090e2 Initial load duke parents: diff changeset	922	// the main, unrolled, part of the loop will never execute as it is protected
489c9b5090e2 Initial load duke parents: diff changeset	923	// by the min-trip test. See bug 4834191 for a case where we over-unrolled
489c9b5090e2 Initial load duke parents: diff changeset	924	// and later determined that part of the unrolled loop was dead.
489c9b5090e2 Initial load duke parents: diff changeset	925	loop_head->set_trip_count(loop_head->trip_count() / 2);
489c9b5090e2 Initial load duke parents: diff changeset	926
489c9b5090e2 Initial load duke parents: diff changeset	927	// Double the count of original iterations in the unrolled loop body.
489c9b5090e2 Initial load duke parents: diff changeset	928	loop_head->double_unrolled_count();
489c9b5090e2 Initial load duke parents: diff changeset	929
489c9b5090e2 Initial load duke parents: diff changeset	930	// -----------
489c9b5090e2 Initial load duke parents: diff changeset	931	// Step 2: Cut back the trip counter for an unroll amount of 2.
489c9b5090e2 Initial load duke parents: diff changeset	932	// Loop will normally trip (limit - init)/stride_con. Since it's a
489c9b5090e2 Initial load duke parents: diff changeset	933	// CountedLoop this is exact (stride divides limit-init exactly).
489c9b5090e2 Initial load duke parents: diff changeset	934	// We are going to double the loop body, so we want to knock off any
489c9b5090e2 Initial load duke parents: diff changeset	935	// odd iteration: (trip_cnt & ~1). Then back compute a new limit.
// The nodes built below compute, all pinned at the loop's entry control:
//   lim2 = init + ((((limit - init) / strid) & -2) * strid)
// The DivI is created with a null (0) control input.
489c9b5090e2 Initial load duke parents: diff changeset	936	Node *span = new (C, 3) SubINode( limit, init );
489c9b5090e2 Initial load duke parents: diff changeset	937	register_new_node( span, ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	938	Node *trip = new (C, 3) DivINode( 0, span, strid );
489c9b5090e2 Initial load duke parents: diff changeset	939	register_new_node( trip, ctrl );
// -2 is the bit pattern ~1: AND-ing with it clears the low bit of the trip
// count.  The constant is given the root as its control.
489c9b5090e2 Initial load duke parents: diff changeset	940	Node *mtwo = _igvn.intcon(-2);
489c9b5090e2 Initial load duke parents: diff changeset	941	set_ctrl(mtwo, C->root());
489c9b5090e2 Initial load duke parents: diff changeset	942	Node *rond = new (C, 3) AndINode( trip, mtwo );
489c9b5090e2 Initial load duke parents: diff changeset	943	register_new_node( rond, ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	944	Node *spn2 = new (C, 3) MulINode( rond, strid );
489c9b5090e2 Initial load duke parents: diff changeset	945	register_new_node( spn2, ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	946	Node *lim2 = new (C, 3) AddINode( spn2, init );
489c9b5090e2 Initial load duke parents: diff changeset	947	register_new_node( lim2, ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	948
489c9b5090e2 Initial load duke parents: diff changeset	949	// Hammer in the new limit
// A fresh CmpI/Bool pair is built (rather than editing the existing one) and
// registered at the loop-end's own control input; the Bool reuses the
// loop-end's current test condition.  loop_end is removed from the IGVN hash
// table before its input is changed.
489c9b5090e2 Initial load duke parents: diff changeset	950	Node *ctrl2 = loop_end->in(0);
489c9b5090e2 Initial load duke parents: diff changeset	951	Node *cmp2 = new (C, 3) CmpINode( loop_head->incr(), lim2 );
489c9b5090e2 Initial load duke parents: diff changeset	952	register_new_node( cmp2, ctrl2 );
489c9b5090e2 Initial load duke parents: diff changeset	953	Node *bol2 = new (C, 2) BoolNode( cmp2, loop_end->test_trip() );
489c9b5090e2 Initial load duke parents: diff changeset	954	register_new_node( bol2, ctrl2 );
489c9b5090e2 Initial load duke parents: diff changeset	955	_igvn.hash_delete(loop_end);
489c9b5090e2 Initial load duke parents: diff changeset	956	loop_end->set_req(CountedLoopEndNode::TestValue, bol2);
489c9b5090e2 Initial load duke parents: diff changeset	957
489c9b5090e2 Initial load duke parents: diff changeset	958	// Step 3: Find the min-trip test guaranteed before a 'main' loop.
489c9b5090e2 Initial load duke parents: diff changeset	959	// Make it a 1-trip test (means at least 2 trips).
489c9b5090e2 Initial load duke parents: diff changeset	960	if( adjust_min_trip ) {
489c9b5090e2 Initial load duke parents: diff changeset	961	// Guard test uses an 'opaque' node which is not shared. Hence I
489c9b5090e2 Initial load duke parents: diff changeset	962	// can edit its inputs directly. Hammer in the new limit for the
489c9b5090e2 Initial load duke parents: diff changeset	963	// minimum-trip guard.
// 'opaq' is the Opaque1 found during the guard walk at the top of the
// function; it is non-NULL here because adjust_min_trip was true there too.
489c9b5090e2 Initial load duke parents: diff changeset	964	assert( opaq->outcnt() == 1, "" );
489c9b5090e2 Initial load duke parents: diff changeset	965	_igvn.hash_delete(opaq);
489c9b5090e2 Initial load duke parents: diff changeset	966	opaq->set_req(1, lim2);
489c9b5090e2 Initial load duke parents: diff changeset	967	}
489c9b5090e2 Initial load duke parents: diff changeset	968
489c9b5090e2 Initial load duke parents: diff changeset	969	// ---------
489c9b5090e2 Initial load duke parents: diff changeset	970	// Step 4: Clone the loop body. Move it inside the loop. This loop body
489c9b5090e2 Initial load duke parents: diff changeset	971	// represents the odd iterations; since the loop trips an even number of
489c9b5090e2 Initial load duke parents: diff changeset	972	// times its backedge is never taken. Kill the backedge.
489c9b5090e2 Initial load duke parents: diff changeset	973	uint dd = dom_depth(loop_head);
489c9b5090e2 Initial load duke parents: diff changeset	974	clone_loop( loop, old_new, dd );
489c9b5090e2 Initial load duke parents: diff changeset	975
489c9b5090e2 Initial load duke parents: diff changeset	976	// Make backedges of the clone equal to backedges of the original.
489c9b5090e2 Initial load duke parents: diff changeset	977	// Make the fall-in from the original come from the fall-out of the clone.
// Only live Phis hanging directly off the original head are rewired.  The
// three set_req calls are order-dependent: the original Phi's backedge input
// is read by the second call before the third overwrites it with top.
489c9b5090e2 Initial load duke parents: diff changeset	978	for (DUIterator_Fast jmax, j = loop_head->fast_outs(jmax); j < jmax; j++) {
489c9b5090e2 Initial load duke parents: diff changeset	979	Node* phi = loop_head->fast_out(j);
489c9b5090e2 Initial load duke parents: diff changeset	980	if( phi->is_Phi() && phi->in(0) == loop_head && phi->outcnt() > 0 ) {
489c9b5090e2 Initial load duke parents: diff changeset	981	Node *newphi = old_new[phi->_idx];
489c9b5090e2 Initial load duke parents: diff changeset	982	_igvn.hash_delete( phi );
489c9b5090e2 Initial load duke parents: diff changeset	983	_igvn.hash_delete( newphi );
489c9b5090e2 Initial load duke parents: diff changeset	984
489c9b5090e2 Initial load duke parents: diff changeset	985	phi ->set_req(LoopNode:: EntryControl, newphi->in(LoopNode::LoopBackControl));
489c9b5090e2 Initial load duke parents: diff changeset	986	newphi->set_req(LoopNode::LoopBackControl, phi ->in(LoopNode::LoopBackControl));
489c9b5090e2 Initial load duke parents: diff changeset	987	phi ->set_req(LoopNode::LoopBackControl, C->top());
489c9b5090e2 Initial load duke parents: diff changeset	988	}
489c9b5090e2 Initial load duke parents: diff changeset	989	}
// Apply the same three-step rewiring to the loop heads themselves: the
// original head is entered from the clone's backedge, the clone's backedge
// becomes the original's backedge, and the original's backedge is set to top.
// The clone then becomes the head recorded in the loop tree.
// NOTE(review): only clone_head is hash_delete'd here before both heads are
// edited - confirm loop_head does not need the same treatment.
489c9b5090e2 Initial load duke parents: diff changeset	990	Node *clone_head = old_new[loop_head->_idx];
489c9b5090e2 Initial load duke parents: diff changeset	991	_igvn.hash_delete( clone_head );
489c9b5090e2 Initial load duke parents: diff changeset	992	loop_head ->set_req(LoopNode:: EntryControl, clone_head->in(LoopNode::LoopBackControl));
489c9b5090e2 Initial load duke parents: diff changeset	993	clone_head->set_req(LoopNode::LoopBackControl, loop_head ->in(LoopNode::LoopBackControl));
489c9b5090e2 Initial load duke parents: diff changeset	994	loop_head ->set_req(LoopNode::LoopBackControl, C->top());
489c9b5090e2 Initial load duke parents: diff changeset	995	loop->_head = clone_head; // New loop header
489c9b5090e2 Initial load duke parents: diff changeset	996
// Both heads have a new entry control now; refresh their immediate
// dominators, keeping the dominator depth captured before cloning.
489c9b5090e2 Initial load duke parents: diff changeset	997	set_idom(loop_head, loop_head ->in(LoopNode::EntryControl), dd);
489c9b5090e2 Initial load duke parents: diff changeset	998	set_idom(clone_head, clone_head->in(LoopNode::EntryControl), dd);
489c9b5090e2 Initial load duke parents: diff changeset	999
489c9b5090e2 Initial load duke parents: diff changeset	1000	// Kill the clone's backedge
// Input 1 of the cloned loop-end is replaced by the integer constant 1
// (presumably the same slot as CountedLoopEndNode::TestValue used above -
// confirm), so its test no longer depends on the trip counter.
489c9b5090e2 Initial load duke parents: diff changeset	1001	Node *newcle = old_new[loop_end->_idx];
489c9b5090e2 Initial load duke parents: diff changeset	1002	_igvn.hash_delete( newcle );
489c9b5090e2 Initial load duke parents: diff changeset	1003	Node *one = _igvn.intcon(1);
489c9b5090e2 Initial load duke parents: diff changeset	1004	set_ctrl(one, C->root());
489c9b5090e2 Initial load duke parents: diff changeset	1005	newcle->set_req(1, one);
489c9b5090e2 Initial load duke parents: diff changeset	1006	// Force clone into same loop body
// The size is snapshotted first because the loop appends to _body while
// iterating; only the pre-existing entries are visited.  Clones of nodes that
// have no recorded control get this loop assigned explicitly via set_loop().
489c9b5090e2 Initial load duke parents: diff changeset	1007	uint max = loop->_body.size();
489c9b5090e2 Initial load duke parents: diff changeset	1008	for( uint k = 0; k < max; k++ ) {
489c9b5090e2 Initial load duke parents: diff changeset	1009	Node *old = loop->_body.at(k);
489c9b5090e2 Initial load duke parents: diff changeset	1010	Node *nnn = old_new[old->_idx];
489c9b5090e2 Initial load duke parents: diff changeset	1011	loop->_body.push(nnn);
489c9b5090e2 Initial load duke parents: diff changeset	1012	if (!has_ctrl(old))
489c9b5090e2 Initial load duke parents: diff changeset	1013	set_loop(nnn, loop);
489c9b5090e2 Initial load duke parents: diff changeset	1014	}
489c9b5090e2 Initial load duke parents: diff changeset	1015	}
489c9b5090e2 Initial load duke parents: diff changeset	1016
489c9b5090e2 Initial load duke parents: diff changeset	1017	//------------------------------do_maximally_unroll----------------------------
489c9b5090e2 Initial load duke parents: diff changeset	1018
489c9b5090e2 Initial load duke parents: diff changeset	1019	void PhaseIdealLoop::do_maximally_unroll( IdealLoopTree *loop, Node_List &old_new ) {
489c9b5090e2 Initial load duke parents: diff changeset	1020	CountedLoopNode *cl = loop->_head->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	1021	assert( cl->trip_count() > 0, "");
489c9b5090e2 Initial load duke parents: diff changeset	1022
489c9b5090e2 Initial load duke parents: diff changeset	1023	// If loop is tripping an odd number of times, peel odd iteration
489c9b5090e2 Initial load duke parents: diff changeset	1024	if( (cl->trip_count() & 1) == 1 ) {
489c9b5090e2 Initial load duke parents: diff changeset	1025	do_peeling( loop, old_new );
489c9b5090e2 Initial load duke parents: diff changeset	1026	}
489c9b5090e2 Initial load duke parents: diff changeset	1027
489c9b5090e2 Initial load duke parents: diff changeset	1028	// Now its tripping an even number of times remaining. Double loop body.
489c9b5090e2 Initial load duke parents: diff changeset	1029	// Do not adjust pre-guards; they are not needed and do not exist.
489c9b5090e2 Initial load duke parents: diff changeset	1030	if( cl->trip_count() > 0 ) {
489c9b5090e2 Initial load duke parents: diff changeset	1031	do_unroll( loop, old_new, false );
489c9b5090e2 Initial load duke parents: diff changeset	1032	}
489c9b5090e2 Initial load duke parents: diff changeset	1033	}
489c9b5090e2 Initial load duke parents: diff changeset	1034
489c9b5090e2 Initial load duke parents: diff changeset	1035	//------------------------------dominates_backedge---------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	1036	// Returns true if ctrl is executed on every complete iteration
489c9b5090e2 Initial load duke parents: diff changeset	1037	bool IdealLoopTree::dominates_backedge(Node* ctrl) {
489c9b5090e2 Initial load duke parents: diff changeset	1038	assert(ctrl->is_CFG(), "must be control");
489c9b5090e2 Initial load duke parents: diff changeset	1039	Node* backedge = _head->as_Loop()->in(LoopNode::LoopBackControl);
489c9b5090e2 Initial load duke parents: diff changeset	1040	return _phase->dom_lca_internal(ctrl, backedge) == ctrl;
489c9b5090e2 Initial load duke parents: diff changeset	1041	}
489c9b5090e2 Initial load duke parents: diff changeset	1042
489c9b5090e2 Initial load duke parents: diff changeset	1043	//------------------------------add_constraint---------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	1044	// Constrain the main loop iterations so the condition:
489c9b5090e2 Initial load duke parents: diff changeset	1045	// scale_con * I + offset < limit
489c9b5090e2 Initial load duke parents: diff changeset	1046	// always holds true. That is, either increase the number of iterations in
489c9b5090e2 Initial load duke parents: diff changeset	1047	// the pre-loop or the post-loop until the condition holds true in the main
489c9b5090e2 Initial load duke parents: diff changeset	1048	// loop. Stride, scale, offset and limit are all loop invariant. Further,
489c9b5090e2 Initial load duke parents: diff changeset	1049	// stride and scale are constants (offset and limit often are).
489c9b5090e2 Initial load duke parents: diff changeset	1050	void PhaseIdealLoop::add_constraint( int stride_con, int scale_con, Node offset, Node limit, Node pre_ctrl, Node pre_limit, Node *main_limit ) {
489c9b5090e2 Initial load duke parents: diff changeset	1051
489c9b5090e2 Initial load duke parents: diff changeset	1052	// Compute "I :: (limit-offset)/scale_con"
489c9b5090e2 Initial load duke parents: diff changeset	1053	Node *con = new (C, 3) SubINode( limit, offset );
489c9b5090e2 Initial load duke parents: diff changeset	1054	register_new_node( con, pre_ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	1055	Node *scale = _igvn.intcon(scale_con);
489c9b5090e2 Initial load duke parents: diff changeset	1056	set_ctrl(scale, C->root());
489c9b5090e2 Initial load duke parents: diff changeset	1057	Node *X = new (C, 3) DivINode( 0, con, scale );
489c9b5090e2 Initial load duke parents: diff changeset	1058	register_new_node( X, pre_ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	1059
489c9b5090e2 Initial load duke parents: diff changeset	1060	// For positive stride, the pre-loop limit always uses a MAX function
489c9b5090e2 Initial load duke parents: diff changeset	1061	// and the main loop a MIN function. For negative stride these are
489c9b5090e2 Initial load duke parents: diff changeset	1062	// reversed.
489c9b5090e2 Initial load duke parents: diff changeset	1063
489c9b5090e2 Initial load duke parents: diff changeset	1064	// Also for positive stride*scale the affine function is increasing, so the
489c9b5090e2 Initial load duke parents: diff changeset	1065	// pre-loop must check for underflow and the post-loop for overflow.
489c9b5090e2 Initial load duke parents: diff changeset	1066	// Negative stride*scale reverses this; pre-loop checks for overflow and
489c9b5090e2 Initial load duke parents: diff changeset	1067	// post-loop for underflow.
489c9b5090e2 Initial load duke parents: diff changeset	1068	if( stride_con*scale_con > 0 ) {
489c9b5090e2 Initial load duke parents: diff changeset	1069	// Compute I < (limit-offset)/scale_con
489c9b5090e2 Initial load duke parents: diff changeset	1070	// Adjust main-loop last iteration to be MIN/MAX(main_loop,X)
489c9b5090e2 Initial load duke parents: diff changeset	1071	*main_limit = (stride_con > 0)
489c9b5090e2 Initial load duke parents: diff changeset	1072	? (Node)(new (C, 3) MinINode( main_limit, X ))
489c9b5090e2 Initial load duke parents: diff changeset	1073	: (Node)(new (C, 3) MaxINode( main_limit, X ));
489c9b5090e2 Initial load duke parents: diff changeset	1074	register_new_node( *main_limit, pre_ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	1075
489c9b5090e2 Initial load duke parents: diff changeset	1076	} else {
489c9b5090e2 Initial load duke parents: diff changeset	1077	// Compute (limit-offset)/scale_con + SGN(-scale_con) <= I
489c9b5090e2 Initial load duke parents: diff changeset	1078	// Add the negation of the main-loop constraint to the pre-loop.
489c9b5090e2 Initial load duke parents: diff changeset	1079	// See footnote [++] below for a derivation of the limit expression.
489c9b5090e2 Initial load duke parents: diff changeset	1080	Node *incr = _igvn.intcon(scale_con > 0 ? -1 : 1);
489c9b5090e2 Initial load duke parents: diff changeset	1081	set_ctrl(incr, C->root());
489c9b5090e2 Initial load duke parents: diff changeset	1082	Node *adj = new (C, 3) AddINode( X, incr );
489c9b5090e2 Initial load duke parents: diff changeset	1083	register_new_node( adj, pre_ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	1084	*pre_limit = (scale_con > 0)
489c9b5090e2 Initial load duke parents: diff changeset	1085	? (Node)new (C, 3) MinINode( pre_limit, adj )
489c9b5090e2 Initial load duke parents: diff changeset	1086	: (Node)new (C, 3) MaxINode( pre_limit, adj );
489c9b5090e2 Initial load duke parents: diff changeset	1087	register_new_node( *pre_limit, pre_ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	1088
489c9b5090e2 Initial load duke parents: diff changeset	1089	// [++] Here's the algebra that justifies the pre-loop limit expression:
489c9b5090e2 Initial load duke parents: diff changeset	1090	//
489c9b5090e2 Initial load duke parents: diff changeset	1091	// NOT( scale_con * I + offset < limit )
489c9b5090e2 Initial load duke parents: diff changeset	1092	// ==
489c9b5090e2 Initial load duke parents: diff changeset	1093	// scale_con * I + offset >= limit
489c9b5090e2 Initial load duke parents: diff changeset	1094	// ==
489c9b5090e2 Initial load duke parents: diff changeset	1095	// SGN(scale_con) * I >= (limit-offset)/\|scale_con\|
489c9b5090e2 Initial load duke parents: diff changeset	1096	// ==
489c9b5090e2 Initial load duke parents: diff changeset	1097	// (limit-offset)/\|scale_con\| <= I * SGN(scale_con)
489c9b5090e2 Initial load duke parents: diff changeset	1098	// ==
489c9b5090e2 Initial load duke parents: diff changeset	1099	// (limit-offset)/\|scale_con\|-1 < I * SGN(scale_con)
489c9b5090e2 Initial load duke parents: diff changeset	1100	// ==
489c9b5090e2 Initial load duke parents: diff changeset	1101	// ( if (scale_con > 0) /common case/
489c9b5090e2 Initial load duke parents: diff changeset	1102	// (limit-offset)/scale_con - 1 < I
489c9b5090e2 Initial load duke parents: diff changeset	1103	// else
489c9b5090e2 Initial load duke parents: diff changeset	1104	// (limit-offset)/scale_con + 1 > I
489c9b5090e2 Initial load duke parents: diff changeset	1105	// )
489c9b5090e2 Initial load duke parents: diff changeset	1106	// ( if (scale_con > 0) /common case/
489c9b5090e2 Initial load duke parents: diff changeset	1107	// (limit-offset)/scale_con + SGN(-scale_con) < I
489c9b5090e2 Initial load duke parents: diff changeset	1108	// else
489c9b5090e2 Initial load duke parents: diff changeset	1109	// (limit-offset)/scale_con + SGN(-scale_con) > I
489c9b5090e2 Initial load duke parents: diff changeset	1110	}
489c9b5090e2 Initial load duke parents: diff changeset	1111	}
489c9b5090e2 Initial load duke parents: diff changeset	1112
489c9b5090e2 Initial load duke parents: diff changeset	1113
489c9b5090e2 Initial load duke parents: diff changeset	1114	//------------------------------is_scaled_iv---------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	1115	// Return true if exp is a constant times an induction var
489c9b5090e2 Initial load duke parents: diff changeset	1116	bool PhaseIdealLoop::is_scaled_iv(Node* exp, Node* iv, int* p_scale) {
489c9b5090e2 Initial load duke parents: diff changeset	1117	if (exp == iv) {
489c9b5090e2 Initial load duke parents: diff changeset	1118	if (p_scale != NULL) {
489c9b5090e2 Initial load duke parents: diff changeset	1119	*p_scale = 1;
489c9b5090e2 Initial load duke parents: diff changeset	1120	}
489c9b5090e2 Initial load duke parents: diff changeset	1121	return true;
489c9b5090e2 Initial load duke parents: diff changeset	1122	}
489c9b5090e2 Initial load duke parents: diff changeset	1123	int opc = exp->Opcode();
489c9b5090e2 Initial load duke parents: diff changeset	1124	if (opc == Op_MulI) {
489c9b5090e2 Initial load duke parents: diff changeset	1125	if (exp->in(1) == iv && exp->in(2)->is_Con()) {
489c9b5090e2 Initial load duke parents: diff changeset	1126	if (p_scale != NULL) {
489c9b5090e2 Initial load duke parents: diff changeset	1127	*p_scale = exp->in(2)->get_int();
489c9b5090e2 Initial load duke parents: diff changeset	1128	}
489c9b5090e2 Initial load duke parents: diff changeset	1129	return true;
489c9b5090e2 Initial load duke parents: diff changeset	1130	}
489c9b5090e2 Initial load duke parents: diff changeset	1131	if (exp->in(2) == iv && exp->in(1)->is_Con()) {
489c9b5090e2 Initial load duke parents: diff changeset	1132	if (p_scale != NULL) {
489c9b5090e2 Initial load duke parents: diff changeset	1133	*p_scale = exp->in(1)->get_int();
489c9b5090e2 Initial load duke parents: diff changeset	1134	}
489c9b5090e2 Initial load duke parents: diff changeset	1135	return true;
489c9b5090e2 Initial load duke parents: diff changeset	1136	}
489c9b5090e2 Initial load duke parents: diff changeset	1137	} else if (opc == Op_LShiftI) {
489c9b5090e2 Initial load duke parents: diff changeset	1138	if (exp->in(1) == iv && exp->in(2)->is_Con()) {
489c9b5090e2 Initial load duke parents: diff changeset	1139	if (p_scale != NULL) {
489c9b5090e2 Initial load duke parents: diff changeset	1140	*p_scale = 1 << exp->in(2)->get_int();
489c9b5090e2 Initial load duke parents: diff changeset	1141	}
489c9b5090e2 Initial load duke parents: diff changeset	1142	return true;
489c9b5090e2 Initial load duke parents: diff changeset	1143	}
489c9b5090e2 Initial load duke parents: diff changeset	1144	}
489c9b5090e2 Initial load duke parents: diff changeset	1145	return false;
489c9b5090e2 Initial load duke parents: diff changeset	1146	}
489c9b5090e2 Initial load duke parents: diff changeset	1147
489c9b5090e2 Initial load duke parents: diff changeset	1148	//-----------------------------is_scaled_iv_plus_offset------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	1149	// Return true if exp is a simple induction variable expression: k1*iv + (invar + k2)
489c9b5090e2 Initial load duke parents: diff changeset	1150	bool PhaseIdealLoop::is_scaled_iv_plus_offset(Node* exp, Node* iv, int* p_scale, Node** p_offset, int depth) {
489c9b5090e2 Initial load duke parents: diff changeset	1151	if (is_scaled_iv(exp, iv, p_scale)) {
489c9b5090e2 Initial load duke parents: diff changeset	1152	if (p_offset != NULL) {
489c9b5090e2 Initial load duke parents: diff changeset	1153	Node *zero = _igvn.intcon(0);
489c9b5090e2 Initial load duke parents: diff changeset	1154	set_ctrl(zero, C->root());
489c9b5090e2 Initial load duke parents: diff changeset	1155	*p_offset = zero;
489c9b5090e2 Initial load duke parents: diff changeset	1156	}
489c9b5090e2 Initial load duke parents: diff changeset	1157	return true;
489c9b5090e2 Initial load duke parents: diff changeset	1158	}
489c9b5090e2 Initial load duke parents: diff changeset	1159	int opc = exp->Opcode();
489c9b5090e2 Initial load duke parents: diff changeset	1160	if (opc == Op_AddI) {
489c9b5090e2 Initial load duke parents: diff changeset	1161	if (is_scaled_iv(exp->in(1), iv, p_scale)) {
489c9b5090e2 Initial load duke parents: diff changeset	1162	if (p_offset != NULL) {
489c9b5090e2 Initial load duke parents: diff changeset	1163	*p_offset = exp->in(2);
489c9b5090e2 Initial load duke parents: diff changeset	1164	}
489c9b5090e2 Initial load duke parents: diff changeset	1165	return true;
489c9b5090e2 Initial load duke parents: diff changeset	1166	}
489c9b5090e2 Initial load duke parents: diff changeset	1167	if (exp->in(2)->is_Con()) {
489c9b5090e2 Initial load duke parents: diff changeset	1168	Node* offset2 = NULL;
489c9b5090e2 Initial load duke parents: diff changeset	1169	if (depth < 2 &&
489c9b5090e2 Initial load duke parents: diff changeset	1170	is_scaled_iv_plus_offset(exp->in(1), iv, p_scale,
489c9b5090e2 Initial load duke parents: diff changeset	1171	p_offset != NULL ? &offset2 : NULL, depth+1)) {
489c9b5090e2 Initial load duke parents: diff changeset	1172	if (p_offset != NULL) {
489c9b5090e2 Initial load duke parents: diff changeset	1173	Node *ctrl_off2 = get_ctrl(offset2);
489c9b5090e2 Initial load duke parents: diff changeset	1174	Node* offset = new (C, 3) AddINode(offset2, exp->in(2));
489c9b5090e2 Initial load duke parents: diff changeset	1175	register_new_node(offset, ctrl_off2);
489c9b5090e2 Initial load duke parents: diff changeset	1176	*p_offset = offset;
489c9b5090e2 Initial load duke parents: diff changeset	1177	}
489c9b5090e2 Initial load duke parents: diff changeset	1178	return true;
489c9b5090e2 Initial load duke parents: diff changeset	1179	}
489c9b5090e2 Initial load duke parents: diff changeset	1180	}
489c9b5090e2 Initial load duke parents: diff changeset	1181	} else if (opc == Op_SubI) {
489c9b5090e2 Initial load duke parents: diff changeset	1182	if (is_scaled_iv(exp->in(1), iv, p_scale)) {
489c9b5090e2 Initial load duke parents: diff changeset	1183	if (p_offset != NULL) {
489c9b5090e2 Initial load duke parents: diff changeset	1184	Node *zero = _igvn.intcon(0);
489c9b5090e2 Initial load duke parents: diff changeset	1185	set_ctrl(zero, C->root());
489c9b5090e2 Initial load duke parents: diff changeset	1186	Node *ctrl_off = get_ctrl(exp->in(2));
489c9b5090e2 Initial load duke parents: diff changeset	1187	Node* offset = new (C, 3) SubINode(zero, exp->in(2));
489c9b5090e2 Initial load duke parents: diff changeset	1188	register_new_node(offset, ctrl_off);
489c9b5090e2 Initial load duke parents: diff changeset	1189	*p_offset = offset;
489c9b5090e2 Initial load duke parents: diff changeset	1190	}
489c9b5090e2 Initial load duke parents: diff changeset	1191	return true;
489c9b5090e2 Initial load duke parents: diff changeset	1192	}
489c9b5090e2 Initial load duke parents: diff changeset	1193	if (is_scaled_iv(exp->in(2), iv, p_scale)) {
489c9b5090e2 Initial load duke parents: diff changeset	1194	if (p_offset != NULL) {
489c9b5090e2 Initial load duke parents: diff changeset	1195	p_scale = -1;
489c9b5090e2 Initial load duke parents: diff changeset	1196	*p_offset = exp->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	1197	}
489c9b5090e2 Initial load duke parents: diff changeset	1198	return true;
489c9b5090e2 Initial load duke parents: diff changeset	1199	}
489c9b5090e2 Initial load duke parents: diff changeset	1200	}
489c9b5090e2 Initial load duke parents: diff changeset	1201	return false;
489c9b5090e2 Initial load duke parents: diff changeset	1202	}
489c9b5090e2 Initial load duke parents: diff changeset	1203
489c9b5090e2 Initial load duke parents: diff changeset	1204	//------------------------------do_range_check---------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	1205	// Eliminate range-checks and other trip-counter vs loop-invariant tests.
489c9b5090e2 Initial load duke parents: diff changeset	1206	void PhaseIdealLoop::do_range_check( IdealLoopTree *loop, Node_List &old_new ) {
489c9b5090e2 Initial load duke parents: diff changeset	1207	#ifndef PRODUCT
489c9b5090e2 Initial load duke parents: diff changeset	1208	if( PrintOpto && VerifyLoopOptimizations ) {
489c9b5090e2 Initial load duke parents: diff changeset	1209	tty->print("Range Check Elimination ");
489c9b5090e2 Initial load duke parents: diff changeset	1210	loop->dump_head();
489c9b5090e2 Initial load duke parents: diff changeset	1211	}
489c9b5090e2 Initial load duke parents: diff changeset	1212	#endif
489c9b5090e2 Initial load duke parents: diff changeset	1213	assert( RangeCheckElimination, "" );
489c9b5090e2 Initial load duke parents: diff changeset	1214	CountedLoopNode *cl = loop->_head->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	1215	assert( cl->is_main_loop(), "" );
489c9b5090e2 Initial load duke parents: diff changeset	1216
489c9b5090e2 Initial load duke parents: diff changeset	1217	// Find the trip counter; we are iteration splitting based on it
489c9b5090e2 Initial load duke parents: diff changeset	1218	Node *trip_counter = cl->phi();
489c9b5090e2 Initial load duke parents: diff changeset	1219	// Find the main loop limit; we will trim it's iterations
489c9b5090e2 Initial load duke parents: diff changeset	1220	// to not ever trip end tests
489c9b5090e2 Initial load duke parents: diff changeset	1221	Node *main_limit = cl->limit();
489c9b5090e2 Initial load duke parents: diff changeset	1222	// Find the pre-loop limit; we will expand it's iterations to
489c9b5090e2 Initial load duke parents: diff changeset	1223	// not ever trip low tests.
489c9b5090e2 Initial load duke parents: diff changeset	1224	Node *ctrl = cl->in(LoopNode::EntryControl);
489c9b5090e2 Initial load duke parents: diff changeset	1225	assert( ctrl->Opcode() == Op_IfTrue \|\| ctrl->Opcode() == Op_IfFalse, "" );
489c9b5090e2 Initial load duke parents: diff changeset	1226	Node *iffm = ctrl->in(0);
489c9b5090e2 Initial load duke parents: diff changeset	1227	assert( iffm->Opcode() == Op_If, "" );
489c9b5090e2 Initial load duke parents: diff changeset	1228	Node *p_f = iffm->in(0);
489c9b5090e2 Initial load duke parents: diff changeset	1229	assert( p_f->Opcode() == Op_IfFalse, "" );
489c9b5090e2 Initial load duke parents: diff changeset	1230	CountedLoopEndNode *pre_end = p_f->in(0)->as_CountedLoopEnd();
489c9b5090e2 Initial load duke parents: diff changeset	1231	assert( pre_end->loopnode()->is_pre_loop(), "" );
489c9b5090e2 Initial load duke parents: diff changeset	1232	Node *pre_opaq1 = pre_end->limit();
489c9b5090e2 Initial load duke parents: diff changeset	1233	// Occasionally it's possible for a pre-loop Opaque1 node to be
489c9b5090e2 Initial load duke parents: diff changeset	1234	// optimized away and then another round of loop opts attempted.
489c9b5090e2 Initial load duke parents: diff changeset	1235	// We can not optimize this particular loop in that case.
489c9b5090e2 Initial load duke parents: diff changeset	1236	if( pre_opaq1->Opcode() != Op_Opaque1 )
489c9b5090e2 Initial load duke parents: diff changeset	1237	return;
489c9b5090e2 Initial load duke parents: diff changeset	1238	Opaque1Node pre_opaq = (Opaque1Node)pre_opaq1;
489c9b5090e2 Initial load duke parents: diff changeset	1239	Node *pre_limit = pre_opaq->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	1240
489c9b5090e2 Initial load duke parents: diff changeset	1241	// Where do we put new limit calculations
489c9b5090e2 Initial load duke parents: diff changeset	1242	Node *pre_ctrl = pre_end->loopnode()->in(LoopNode::EntryControl);
489c9b5090e2 Initial load duke parents: diff changeset	1243
489c9b5090e2 Initial load duke parents: diff changeset	1244	// Ensure the original loop limit is available from the
489c9b5090e2 Initial load duke parents: diff changeset	1245	// pre-loop Opaque1 node.
489c9b5090e2 Initial load duke parents: diff changeset	1246	Node *orig_limit = pre_opaq->original_loop_limit();
489c9b5090e2 Initial load duke parents: diff changeset	1247	if( orig_limit == NULL \|\| _igvn.type(orig_limit) == Type::TOP )
489c9b5090e2 Initial load duke parents: diff changeset	1248	return;
489c9b5090e2 Initial load duke parents: diff changeset	1249
489c9b5090e2 Initial load duke parents: diff changeset	1250	// Need to find the main-loop zero-trip guard
489c9b5090e2 Initial load duke parents: diff changeset	1251	Node *bolzm = iffm->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	1252	assert( bolzm->Opcode() == Op_Bool, "" );
489c9b5090e2 Initial load duke parents: diff changeset	1253	Node *cmpzm = bolzm->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	1254	assert( cmpzm->is_Cmp(), "" );
489c9b5090e2 Initial load duke parents: diff changeset	1255	Node *opqzm = cmpzm->in(2);
489c9b5090e2 Initial load duke parents: diff changeset	1256	if( opqzm->Opcode() != Op_Opaque1 )
489c9b5090e2 Initial load duke parents: diff changeset	1257	return;
489c9b5090e2 Initial load duke parents: diff changeset	1258	assert( opqzm->in(1) == main_limit, "do not understand situation" );
489c9b5090e2 Initial load duke parents: diff changeset	1259
489c9b5090e2 Initial load duke parents: diff changeset	1260	// Must know if its a count-up or count-down loop
489c9b5090e2 Initial load duke parents: diff changeset	1261
489c9b5090e2 Initial load duke parents: diff changeset	1262	// protect against stride not being a constant
489c9b5090e2 Initial load duke parents: diff changeset	1263	if ( !cl->stride_is_con() ) {
489c9b5090e2 Initial load duke parents: diff changeset	1264	return;
489c9b5090e2 Initial load duke parents: diff changeset	1265	}
489c9b5090e2 Initial load duke parents: diff changeset	1266	int stride_con = cl->stride_con();
489c9b5090e2 Initial load duke parents: diff changeset	1267	Node *zero = _igvn.intcon(0);
489c9b5090e2 Initial load duke parents: diff changeset	1268	Node *one = _igvn.intcon(1);
489c9b5090e2 Initial load duke parents: diff changeset	1269	set_ctrl(zero, C->root());
489c9b5090e2 Initial load duke parents: diff changeset	1270	set_ctrl(one, C->root());
489c9b5090e2 Initial load duke parents: diff changeset	1271
489c9b5090e2 Initial load duke parents: diff changeset	1272	// Range checks that do not dominate the loop backedge (ie.
489c9b5090e2 Initial load duke parents: diff changeset	1273	// conditionally executed) can lengthen the pre loop limit beyond
489c9b5090e2 Initial load duke parents: diff changeset	1274	// the original loop limit. To prevent this, the pre limit is
489c9b5090e2 Initial load duke parents: diff changeset	1275	// (for stride > 0) MINed with the original loop limit (MAXed
489c9b5090e2 Initial load duke parents: diff changeset	1276	// stride < 0) when some range_check (rc) is conditionally
489c9b5090e2 Initial load duke parents: diff changeset	1277	// executed.
489c9b5090e2 Initial load duke parents: diff changeset	1278	bool conditional_rc = false;
489c9b5090e2 Initial load duke parents: diff changeset	1279
489c9b5090e2 Initial load duke parents: diff changeset	1280	// Check loop body for tests of trip-counter plus loop-invariant vs
489c9b5090e2 Initial load duke parents: diff changeset	1281	// loop-invariant.
489c9b5090e2 Initial load duke parents: diff changeset	1282	for( uint i = 0; i < loop->_body.size(); i++ ) {
489c9b5090e2 Initial load duke parents: diff changeset	1283	Node *iff = loop->_body[i];
489c9b5090e2 Initial load duke parents: diff changeset	1284	if( iff->Opcode() == Op_If ) { // Test?
489c9b5090e2 Initial load duke parents: diff changeset	1285
489c9b5090e2 Initial load duke parents: diff changeset	1286	// Test is an IfNode, has 2 projections. If BOTH are in the loop
489c9b5090e2 Initial load duke parents: diff changeset	1287	// we need loop unswitching instead of iteration splitting.
489c9b5090e2 Initial load duke parents: diff changeset	1288	Node *exit = loop->is_loop_exit(iff);
489c9b5090e2 Initial load duke parents: diff changeset	1289	if( !exit ) continue;
489c9b5090e2 Initial load duke parents: diff changeset	1290	int flip = (exit->Opcode() == Op_IfTrue) ? 1 : 0;
489c9b5090e2 Initial load duke parents: diff changeset	1291
489c9b5090e2 Initial load duke parents: diff changeset	1292	// Get boolean condition to test
489c9b5090e2 Initial load duke parents: diff changeset	1293	Node *i1 = iff->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	1294	if( !i1->is_Bool() ) continue;
489c9b5090e2 Initial load duke parents: diff changeset	1295	BoolNode *bol = i1->as_Bool();
489c9b5090e2 Initial load duke parents: diff changeset	1296	BoolTest b_test = bol->_test;
489c9b5090e2 Initial load duke parents: diff changeset	1297	// Flip sense of test if exit condition is flipped
489c9b5090e2 Initial load duke parents: diff changeset	1298	if( flip )
489c9b5090e2 Initial load duke parents: diff changeset	1299	b_test = b_test.negate();
489c9b5090e2 Initial load duke parents: diff changeset	1300
489c9b5090e2 Initial load duke parents: diff changeset	1301	// Get compare
489c9b5090e2 Initial load duke parents: diff changeset	1302	Node *cmp = bol->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	1303
489c9b5090e2 Initial load duke parents: diff changeset	1304	// Look for trip_counter + offset vs limit
489c9b5090e2 Initial load duke parents: diff changeset	1305	Node *rc_exp = cmp->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	1306	Node *limit = cmp->in(2);
489c9b5090e2 Initial load duke parents: diff changeset	1307	jint scale_con= 1; // Assume trip counter not scaled
489c9b5090e2 Initial load duke parents: diff changeset	1308
489c9b5090e2 Initial load duke parents: diff changeset	1309	Node *limit_c = get_ctrl(limit);
489c9b5090e2 Initial load duke parents: diff changeset	1310	if( loop->is_member(get_loop(limit_c) ) ) {
489c9b5090e2 Initial load duke parents: diff changeset	1311	// Compare might have operands swapped; commute them
489c9b5090e2 Initial load duke parents: diff changeset	1312	b_test = b_test.commute();
489c9b5090e2 Initial load duke parents: diff changeset	1313	rc_exp = cmp->in(2);
489c9b5090e2 Initial load duke parents: diff changeset	1314	limit = cmp->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	1315	limit_c = get_ctrl(limit);
489c9b5090e2 Initial load duke parents: diff changeset	1316	if( loop->is_member(get_loop(limit_c) ) )
489c9b5090e2 Initial load duke parents: diff changeset	1317	continue; // Both inputs are loop varying; cannot RCE
489c9b5090e2 Initial load duke parents: diff changeset	1318	}
489c9b5090e2 Initial load duke parents: diff changeset	1319	// Here we know 'limit' is loop invariant
489c9b5090e2 Initial load duke parents: diff changeset	1320
489c9b5090e2 Initial load duke parents: diff changeset	1321	// 'limit' maybe pinned below the zero trip test (probably from a
489c9b5090e2 Initial load duke parents: diff changeset	1322	// previous round of rce), in which case, it can't be used in the
489c9b5090e2 Initial load duke parents: diff changeset	1323	// zero trip test expression which must occur before the zero test's if.
489c9b5090e2 Initial load duke parents: diff changeset	1324	if( limit_c == ctrl ) {
489c9b5090e2 Initial load duke parents: diff changeset	1325	continue; // Don't rce this check but continue looking for other candidates.
489c9b5090e2 Initial load duke parents: diff changeset	1326	}
489c9b5090e2 Initial load duke parents: diff changeset	1327
489c9b5090e2 Initial load duke parents: diff changeset	1328	// Check for scaled induction variable plus an offset
489c9b5090e2 Initial load duke parents: diff changeset	1329	Node *offset = NULL;
489c9b5090e2 Initial load duke parents: diff changeset	1330
489c9b5090e2 Initial load duke parents: diff changeset	1331	if (!is_scaled_iv_plus_offset(rc_exp, trip_counter, &scale_con, &offset)) {
489c9b5090e2 Initial load duke parents: diff changeset	1332	continue;
489c9b5090e2 Initial load duke parents: diff changeset	1333	}
489c9b5090e2 Initial load duke parents: diff changeset	1334
489c9b5090e2 Initial load duke parents: diff changeset	1335	Node *offset_c = get_ctrl(offset);
489c9b5090e2 Initial load duke parents: diff changeset	1336	if( loop->is_member( get_loop(offset_c) ) )
489c9b5090e2 Initial load duke parents: diff changeset	1337	continue; // Offset is not really loop invariant
489c9b5090e2 Initial load duke parents: diff changeset	1338	// Here we know 'offset' is loop invariant.
489c9b5090e2 Initial load duke parents: diff changeset	1339
489c9b5090e2 Initial load duke parents: diff changeset	1340	// As above for the 'limit', the 'offset' maybe pinned below the
489c9b5090e2 Initial load duke parents: diff changeset	1341	// zero trip test.
489c9b5090e2 Initial load duke parents: diff changeset	1342	if( offset_c == ctrl ) {
489c9b5090e2 Initial load duke parents: diff changeset	1343	continue; // Don't rce this check but continue looking for other candidates.
489c9b5090e2 Initial load duke parents: diff changeset	1344	}
489c9b5090e2 Initial load duke parents: diff changeset	1345
489c9b5090e2 Initial load duke parents: diff changeset	1346	// At this point we have the expression as:
489c9b5090e2 Initial load duke parents: diff changeset	1347	// scale_con * trip_counter + offset :: limit
489c9b5090e2 Initial load duke parents: diff changeset	1348	// where scale_con, offset and limit are loop invariant. Trip_counter
489c9b5090e2 Initial load duke parents: diff changeset	1349	// monotonically increases by stride_con, a constant. Both (or either)
489c9b5090e2 Initial load duke parents: diff changeset	1350	// stride_con and scale_con can be negative which will flip about the
489c9b5090e2 Initial load duke parents: diff changeset	1351	// sense of the test.
489c9b5090e2 Initial load duke parents: diff changeset	1352
489c9b5090e2 Initial load duke parents: diff changeset	1353	// Adjust pre and main loop limits to guard the correct iteration set
489c9b5090e2 Initial load duke parents: diff changeset	1354	if( cmp->Opcode() == Op_CmpU ) {// Unsigned compare is really 2 tests
489c9b5090e2 Initial load duke parents: diff changeset	1355	if( b_test._test == BoolTest::lt ) { // Range checks always use lt
489c9b5090e2 Initial load duke parents: diff changeset	1356	// The overflow limit: scale*I+offset < limit
489c9b5090e2 Initial load duke parents: diff changeset	1357	add_constraint( stride_con, scale_con, offset, limit, pre_ctrl, &pre_limit, &main_limit );
489c9b5090e2 Initial load duke parents: diff changeset	1358	// The underflow limit: 0 <= scale*I+offset.
489c9b5090e2 Initial load duke parents: diff changeset	1359	// Some math yields: -scale*I-(offset+1) < 0
489c9b5090e2 Initial load duke parents: diff changeset	1360	Node *plus_one = new (C, 3) AddINode( offset, one );
489c9b5090e2 Initial load duke parents: diff changeset	1361	register_new_node( plus_one, pre_ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	1362	Node *neg_offset = new (C, 3) SubINode( zero, plus_one );
489c9b5090e2 Initial load duke parents: diff changeset	1363	register_new_node( neg_offset, pre_ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	1364	add_constraint( stride_con, -scale_con, neg_offset, zero, pre_ctrl, &pre_limit, &main_limit );
489c9b5090e2 Initial load duke parents: diff changeset	1365	if (!conditional_rc) {
489c9b5090e2 Initial load duke parents: diff changeset	1366	conditional_rc = !loop->dominates_backedge(iff);
489c9b5090e2 Initial load duke parents: diff changeset	1367	}
489c9b5090e2 Initial load duke parents: diff changeset	1368	} else {
489c9b5090e2 Initial load duke parents: diff changeset	1369	#ifndef PRODUCT
489c9b5090e2 Initial load duke parents: diff changeset	1370	if( PrintOpto )
489c9b5090e2 Initial load duke parents: diff changeset	1371	tty->print_cr("missed RCE opportunity");
489c9b5090e2 Initial load duke parents: diff changeset	1372	#endif
489c9b5090e2 Initial load duke parents: diff changeset	1373	continue; // In release mode, ignore it
489c9b5090e2 Initial load duke parents: diff changeset	1374	}
489c9b5090e2 Initial load duke parents: diff changeset	1375	} else { // Otherwise work on normal compares
489c9b5090e2 Initial load duke parents: diff changeset	1376	switch( b_test._test ) {
489c9b5090e2 Initial load duke parents: diff changeset	1377	case BoolTest::ge: // Convert X >= Y to -X <= -Y
489c9b5090e2 Initial load duke parents: diff changeset	1378	scale_con = -scale_con;
489c9b5090e2 Initial load duke parents: diff changeset	1379	offset = new (C, 3) SubINode( zero, offset );
489c9b5090e2 Initial load duke parents: diff changeset	1380	register_new_node( offset, pre_ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	1381	limit = new (C, 3) SubINode( zero, limit );
489c9b5090e2 Initial load duke parents: diff changeset	1382	register_new_node( limit, pre_ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	1383	// Fall into LE case
489c9b5090e2 Initial load duke parents: diff changeset	1384	case BoolTest::le: // Convert X <= Y to X < Y+1
489c9b5090e2 Initial load duke parents: diff changeset	1385	limit = new (C, 3) AddINode( limit, one );
489c9b5090e2 Initial load duke parents: diff changeset	1386	register_new_node( limit, pre_ctrl );
489c9b5090e2 Initial load duke parents: diff changeset	1387	// Fall into LT case
489c9b5090e2 Initial load duke parents: diff changeset	1388	case BoolTest::lt:
489c9b5090e2 Initial load duke parents: diff changeset	1389	add_constraint( stride_con, scale_con, offset, limit, pre_ctrl, &pre_limit, &main_limit );
489c9b5090e2 Initial load duke parents: diff changeset	1390	if (!conditional_rc) {
489c9b5090e2 Initial load duke parents: diff changeset	1391	conditional_rc = !loop->dominates_backedge(iff);
489c9b5090e2 Initial load duke parents: diff changeset	1392	}
489c9b5090e2 Initial load duke parents: diff changeset	1393	break;
489c9b5090e2 Initial load duke parents: diff changeset	1394	default:
489c9b5090e2 Initial load duke parents: diff changeset	1395	#ifndef PRODUCT
489c9b5090e2 Initial load duke parents: diff changeset	1396	if( PrintOpto )
489c9b5090e2 Initial load duke parents: diff changeset	1397	tty->print_cr("missed RCE opportunity");
489c9b5090e2 Initial load duke parents: diff changeset	1398	#endif
489c9b5090e2 Initial load duke parents: diff changeset	1399	continue; // Unhandled case
489c9b5090e2 Initial load duke parents: diff changeset	1400	}
489c9b5090e2 Initial load duke parents: diff changeset	1401	}
489c9b5090e2 Initial load duke parents: diff changeset	1402
489c9b5090e2 Initial load duke parents: diff changeset	1403	// Kill the eliminated test
489c9b5090e2 Initial load duke parents: diff changeset	1404	C->set_major_progress();
489c9b5090e2 Initial load duke parents: diff changeset	1405	Node *kill_con = _igvn.intcon( 1-flip );
489c9b5090e2 Initial load duke parents: diff changeset	1406	set_ctrl(kill_con, C->root());
489c9b5090e2 Initial load duke parents: diff changeset	1407	_igvn.hash_delete(iff);
489c9b5090e2 Initial load duke parents: diff changeset	1408	iff->set_req(1, kill_con);
489c9b5090e2 Initial load duke parents: diff changeset	1409	_igvn._worklist.push(iff);
489c9b5090e2 Initial load duke parents: diff changeset	1410	// Find surviving projection
489c9b5090e2 Initial load duke parents: diff changeset	1411	assert(iff->is_If(), "");
489c9b5090e2 Initial load duke parents: diff changeset	1412	ProjNode* dp = ((IfNode*)iff)->proj_out(1-flip);
489c9b5090e2 Initial load duke parents: diff changeset	1413	// Find loads off the surviving projection; remove their control edge
489c9b5090e2 Initial load duke parents: diff changeset	1414	for (DUIterator_Fast imax, i = dp->fast_outs(imax); i < imax; i++) {
489c9b5090e2 Initial load duke parents: diff changeset	1415	Node* cd = dp->fast_out(i); // Control-dependent node
489c9b5090e2 Initial load duke parents: diff changeset	1416	if( cd->is_Load() ) { // Loads can now float around in the loop
489c9b5090e2 Initial load duke parents: diff changeset	1417	_igvn.hash_delete(cd);
489c9b5090e2 Initial load duke parents: diff changeset	1418	// Allow the load to float around in the loop, or before it
489c9b5090e2 Initial load duke parents: diff changeset	1419	// but NOT before the pre-loop.
489c9b5090e2 Initial load duke parents: diff changeset	1420	cd->set_req(0, ctrl); // ctrl, not NULL
489c9b5090e2 Initial load duke parents: diff changeset	1421	_igvn._worklist.push(cd);
489c9b5090e2 Initial load duke parents: diff changeset	1422	--i;
489c9b5090e2 Initial load duke parents: diff changeset	1423	--imax;
489c9b5090e2 Initial load duke parents: diff changeset	1424	}
489c9b5090e2 Initial load duke parents: diff changeset	1425	}
489c9b5090e2 Initial load duke parents: diff changeset	1426
489c9b5090e2 Initial load duke parents: diff changeset	1427	} // End of is IF
489c9b5090e2 Initial load duke parents: diff changeset	1428
489c9b5090e2 Initial load duke parents: diff changeset	1429	}
489c9b5090e2 Initial load duke parents: diff changeset	1430
489c9b5090e2 Initial load duke parents: diff changeset	1431	// Update loop limits
489c9b5090e2 Initial load duke parents: diff changeset	1432	if (conditional_rc) {
489c9b5090e2 Initial load duke parents: diff changeset	1433	pre_limit = (stride_con > 0) ? (Node*)new (C,3) MinINode(pre_limit, orig_limit)
489c9b5090e2 Initial load duke parents: diff changeset	1434	: (Node*)new (C,3) MaxINode(pre_limit, orig_limit);
489c9b5090e2 Initial load duke parents: diff changeset	1435	register_new_node(pre_limit, pre_ctrl);
489c9b5090e2 Initial load duke parents: diff changeset	1436	}
489c9b5090e2 Initial load duke parents: diff changeset	1437	_igvn.hash_delete(pre_opaq);
489c9b5090e2 Initial load duke parents: diff changeset	1438	pre_opaq->set_req(1, pre_limit);
489c9b5090e2 Initial load duke parents: diff changeset	1439
489c9b5090e2 Initial load duke parents: diff changeset	1440	// Note:: we are making the main loop limit no longer precise;
489c9b5090e2 Initial load duke parents: diff changeset	1441	// need to round up based on stride.
489c9b5090e2 Initial load duke parents: diff changeset	1442	if( stride_con != 1 && stride_con != -1 ) { // Cutout for common case
489c9b5090e2 Initial load duke parents: diff changeset	1443	// "Standard" round-up logic: ([main_limit-init+(y-1)]/y)*y+init
489c9b5090e2 Initial load duke parents: diff changeset	1444	// Hopefully, compiler will optimize for powers of 2.
489c9b5090e2 Initial load duke parents: diff changeset	1445	Node *ctrl = get_ctrl(main_limit);
489c9b5090e2 Initial load duke parents: diff changeset	1446	Node *stride = cl->stride();
489c9b5090e2 Initial load duke parents: diff changeset	1447	Node *init = cl->init_trip();
489c9b5090e2 Initial load duke parents: diff changeset	1448	Node *span = new (C, 3) SubINode(main_limit,init);
489c9b5090e2 Initial load duke parents: diff changeset	1449	register_new_node(span,ctrl);
489c9b5090e2 Initial load duke parents: diff changeset	1450	Node *rndup = _igvn.intcon(stride_con + ((stride_con>0)?-1:1));
489c9b5090e2 Initial load duke parents: diff changeset	1451	Node *add = new (C, 3) AddINode(span,rndup);
489c9b5090e2 Initial load duke parents: diff changeset	1452	register_new_node(add,ctrl);
489c9b5090e2 Initial load duke parents: diff changeset	1453	Node *div = new (C, 3) DivINode(0,add,stride);
489c9b5090e2 Initial load duke parents: diff changeset	1454	register_new_node(div,ctrl);
489c9b5090e2 Initial load duke parents: diff changeset	1455	Node *mul = new (C, 3) MulINode(div,stride);
489c9b5090e2 Initial load duke parents: diff changeset	1456	register_new_node(mul,ctrl);
489c9b5090e2 Initial load duke parents: diff changeset	1457	Node *newlim = new (C, 3) AddINode(mul,init);
489c9b5090e2 Initial load duke parents: diff changeset	1458	register_new_node(newlim,ctrl);
489c9b5090e2 Initial load duke parents: diff changeset	1459	main_limit = newlim;
489c9b5090e2 Initial load duke parents: diff changeset	1460	}
489c9b5090e2 Initial load duke parents: diff changeset	1461
489c9b5090e2 Initial load duke parents: diff changeset	1462	Node *main_cle = cl->loopexit();
489c9b5090e2 Initial load duke parents: diff changeset	1463	Node *main_bol = main_cle->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	1464	// Hacking loop bounds; need private copies of exit test
489c9b5090e2 Initial load duke parents: diff changeset	1465	if( main_bol->outcnt() > 1 ) {// BoolNode shared?
489c9b5090e2 Initial load duke parents: diff changeset	1466	_igvn.hash_delete(main_cle);
489c9b5090e2 Initial load duke parents: diff changeset	1467	main_bol = main_bol->clone();// Clone a private BoolNode
489c9b5090e2 Initial load duke parents: diff changeset	1468	register_new_node( main_bol, main_cle->in(0) );
489c9b5090e2 Initial load duke parents: diff changeset	1469	main_cle->set_req(1,main_bol);
489c9b5090e2 Initial load duke parents: diff changeset	1470	}
489c9b5090e2 Initial load duke parents: diff changeset	1471	Node *main_cmp = main_bol->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	1472	if( main_cmp->outcnt() > 1 ) { // CmpNode shared?
489c9b5090e2 Initial load duke parents: diff changeset	1473	_igvn.hash_delete(main_bol);
489c9b5090e2 Initial load duke parents: diff changeset	1474	main_cmp = main_cmp->clone();// Clone a private CmpNode
489c9b5090e2 Initial load duke parents: diff changeset	1475	register_new_node( main_cmp, main_cle->in(0) );
489c9b5090e2 Initial load duke parents: diff changeset	1476	main_bol->set_req(1,main_cmp);
489c9b5090e2 Initial load duke parents: diff changeset	1477	}
489c9b5090e2 Initial load duke parents: diff changeset	1478	// Hack the now-private loop bounds
489c9b5090e2 Initial load duke parents: diff changeset	1479	_igvn.hash_delete(main_cmp);
489c9b5090e2 Initial load duke parents: diff changeset	1480	main_cmp->set_req(2, main_limit);
489c9b5090e2 Initial load duke parents: diff changeset	1481	_igvn._worklist.push(main_cmp);
489c9b5090e2 Initial load duke parents: diff changeset	1482	// The OpaqueNode is unshared by design
489c9b5090e2 Initial load duke parents: diff changeset	1483	_igvn.hash_delete(opqzm);
489c9b5090e2 Initial load duke parents: diff changeset	1484	assert( opqzm->outcnt() == 1, "cannot hack shared node" );
489c9b5090e2 Initial load duke parents: diff changeset	1485	opqzm->set_req(1,main_limit);
489c9b5090e2 Initial load duke parents: diff changeset	1486	_igvn._worklist.push(opqzm);
489c9b5090e2 Initial load duke parents: diff changeset	1487	}
489c9b5090e2 Initial load duke parents: diff changeset	1488
489c9b5090e2 Initial load duke parents: diff changeset	1489	//------------------------------DCE_loop_body----------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	1490	// Remove simplistic dead code from loop body
489c9b5090e2 Initial load duke parents: diff changeset	1491	void IdealLoopTree::DCE_loop_body() {
489c9b5090e2 Initial load duke parents: diff changeset	1492	for( uint i = 0; i < _body.size(); i++ )
489c9b5090e2 Initial load duke parents: diff changeset	1493	if( _body.at(i)->outcnt() == 0 )
489c9b5090e2 Initial load duke parents: diff changeset	1494	_body.map( i--, _body.pop() );
489c9b5090e2 Initial load duke parents: diff changeset	1495	}
489c9b5090e2 Initial load duke parents: diff changeset	1496
489c9b5090e2 Initial load duke parents: diff changeset	1497
489c9b5090e2 Initial load duke parents: diff changeset	1498	//------------------------------adjust_loop_exit_prob--------------------------
489c9b5090e2 Initial load duke parents: diff changeset	1499	// Look for loop-exit tests with the 50/50 (or worse) guesses from the parsing stage.
489c9b5090e2 Initial load duke parents: diff changeset	1500	// Replace with a 1-in-10 exit guess.
489c9b5090e2 Initial load duke parents: diff changeset	1501	void IdealLoopTree::adjust_loop_exit_prob( PhaseIdealLoop *phase ) {
489c9b5090e2 Initial load duke parents: diff changeset	1502	Node *test = tail();
489c9b5090e2 Initial load duke parents: diff changeset	1503	while( test != _head ) {
489c9b5090e2 Initial load duke parents: diff changeset	1504	uint top = test->Opcode();
489c9b5090e2 Initial load duke parents: diff changeset	1505	if( top == Op_IfTrue \|\| top == Op_IfFalse ) {
489c9b5090e2 Initial load duke parents: diff changeset	1506	int test_con = ((ProjNode*)test)->_con;
489c9b5090e2 Initial load duke parents: diff changeset	1507	assert(top == (uint)(test_con? Op_IfTrue: Op_IfFalse), "sanity");
489c9b5090e2 Initial load duke parents: diff changeset	1508	IfNode *iff = test->in(0)->as_If();
489c9b5090e2 Initial load duke parents: diff changeset	1509	if( iff->outcnt() == 2 ) { // Ignore dead tests
489c9b5090e2 Initial load duke parents: diff changeset	1510	Node *bol = iff->in(1);
489c9b5090e2 Initial load duke parents: diff changeset	1511	if( bol && bol->req() > 1 && bol->in(1) &&
489c9b5090e2 Initial load duke parents: diff changeset	1512	((bol->in(1)->Opcode() == Op_StorePConditional ) \|\|
489c9b5090e2 Initial load duke parents: diff changeset	1513	(bol->in(1)->Opcode() == Op_StoreLConditional ) \|\|
489c9b5090e2 Initial load duke parents: diff changeset	1514	(bol->in(1)->Opcode() == Op_CompareAndSwapI ) \|\|
489c9b5090e2 Initial load duke parents: diff changeset	1515	(bol->in(1)->Opcode() == Op_CompareAndSwapL ) \|\|
489c9b5090e2 Initial load duke parents: diff changeset	1516	(bol->in(1)->Opcode() == Op_CompareAndSwapP )))
489c9b5090e2 Initial load duke parents: diff changeset	1517	return; // Allocation loops RARELY take backedge
489c9b5090e2 Initial load duke parents: diff changeset	1518	// Find the OTHER exit path from the IF
489c9b5090e2 Initial load duke parents: diff changeset	1519	Node* ex = iff->proj_out(1-test_con);
489c9b5090e2 Initial load duke parents: diff changeset	1520	float p = iff->_prob;
489c9b5090e2 Initial load duke parents: diff changeset	1521	if( !phase->is_member( this, ex ) && iff->_fcnt == COUNT_UNKNOWN ) {
489c9b5090e2 Initial load duke parents: diff changeset	1522	if( top == Op_IfTrue ) {
489c9b5090e2 Initial load duke parents: diff changeset	1523	if( p < (PROB_FAIR + PROB_UNLIKELY_MAG(3))) {
489c9b5090e2 Initial load duke parents: diff changeset	1524	iff->_prob = PROB_STATIC_FREQUENT;
489c9b5090e2 Initial load duke parents: diff changeset	1525	}
489c9b5090e2 Initial load duke parents: diff changeset	1526	} else {
489c9b5090e2 Initial load duke parents: diff changeset	1527	if( p > (PROB_FAIR - PROB_UNLIKELY_MAG(3))) {
489c9b5090e2 Initial load duke parents: diff changeset	1528	iff->_prob = PROB_STATIC_INFREQUENT;
489c9b5090e2 Initial load duke parents: diff changeset	1529	}
489c9b5090e2 Initial load duke parents: diff changeset	1530	}
489c9b5090e2 Initial load duke parents: diff changeset	1531	}
489c9b5090e2 Initial load duke parents: diff changeset	1532	}
489c9b5090e2 Initial load duke parents: diff changeset	1533	}
489c9b5090e2 Initial load duke parents: diff changeset	1534	test = phase->idom(test);
489c9b5090e2 Initial load duke parents: diff changeset	1535	}
489c9b5090e2 Initial load duke parents: diff changeset	1536	}
489c9b5090e2 Initial load duke parents: diff changeset	1537
489c9b5090e2 Initial load duke parents: diff changeset	1538
489c9b5090e2 Initial load duke parents: diff changeset	1539	//------------------------------policy_do_remove_empty_loop--------------------
489c9b5090e2 Initial load duke parents: diff changeset	1540	// Micro-benchmark spamming. Policy is to always remove empty loops.
489c9b5090e2 Initial load duke parents: diff changeset	1541	// The 'DO' part is to replace the trip counter with the value it will
489c9b5090e2 Initial load duke parents: diff changeset	1542	// have on the last iteration. This will break the loop.
489c9b5090e2 Initial load duke parents: diff changeset	1543	bool IdealLoopTree::policy_do_remove_empty_loop( PhaseIdealLoop *phase ) {
489c9b5090e2 Initial load duke parents: diff changeset	1544	// Minimum size must be empty loop
489c9b5090e2 Initial load duke parents: diff changeset	1545	if( _body.size() > 7/number of nodes in an empty loop/ ) return false;
489c9b5090e2 Initial load duke parents: diff changeset	1546
489c9b5090e2 Initial load duke parents: diff changeset	1547	if( !_head->is_CountedLoop() ) return false; // Dead loop
489c9b5090e2 Initial load duke parents: diff changeset	1548	CountedLoopNode *cl = _head->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	1549	if( !cl->loopexit() ) return false; // Malformed loop
489c9b5090e2 Initial load duke parents: diff changeset	1550	if( !phase->is_member(this,phase->get_ctrl(cl->loopexit()->in(CountedLoopEndNode::TestValue)) ) )
489c9b5090e2 Initial load duke parents: diff changeset	1551	return false; // Infinite loop
489c9b5090e2 Initial load duke parents: diff changeset	1552	#ifndef PRODUCT
489c9b5090e2 Initial load duke parents: diff changeset	1553	if( PrintOpto )
489c9b5090e2 Initial load duke parents: diff changeset	1554	tty->print_cr("Removing empty loop");
489c9b5090e2 Initial load duke parents: diff changeset	1555	#endif
489c9b5090e2 Initial load duke parents: diff changeset	1556	#ifdef ASSERT
489c9b5090e2 Initial load duke parents: diff changeset	1557	// Ensure only one phi which is the iv.
489c9b5090e2 Initial load duke parents: diff changeset	1558	Node* iv = NULL;
489c9b5090e2 Initial load duke parents: diff changeset	1559	for (DUIterator_Fast imax, i = cl->fast_outs(imax); i < imax; i++) {
489c9b5090e2 Initial load duke parents: diff changeset	1560	Node* n = cl->fast_out(i);
489c9b5090e2 Initial load duke parents: diff changeset	1561	if (n->Opcode() == Op_Phi) {
489c9b5090e2 Initial load duke parents: diff changeset	1562	assert(iv == NULL, "Too many phis" );
489c9b5090e2 Initial load duke parents: diff changeset	1563	iv = n;
489c9b5090e2 Initial load duke parents: diff changeset	1564	}
489c9b5090e2 Initial load duke parents: diff changeset	1565	}
489c9b5090e2 Initial load duke parents: diff changeset	1566	assert(iv == cl->phi(), "Wrong phi" );
489c9b5090e2 Initial load duke parents: diff changeset	1567	#endif
489c9b5090e2 Initial load duke parents: diff changeset	1568	// Replace the phi at loop head with the final value of the last
489c9b5090e2 Initial load duke parents: diff changeset	1569	// iteration. Then the CountedLoopEnd will collapse (backedge never
489c9b5090e2 Initial load duke parents: diff changeset	1570	// taken) and all loop-invariant uses of the exit values will be correct.
489c9b5090e2 Initial load duke parents: diff changeset	1571	Node *phi = cl->phi();
489c9b5090e2 Initial load duke parents: diff changeset	1572	Node *final = new (phase->C, 3) SubINode( cl->limit(), cl->stride() );
489c9b5090e2 Initial load duke parents: diff changeset	1573	phase->register_new_node(final,cl->in(LoopNode::EntryControl));
489c9b5090e2 Initial load duke parents: diff changeset	1574	phase->_igvn.hash_delete(phi);
489c9b5090e2 Initial load duke parents: diff changeset	1575	phase->_igvn.subsume_node(phi,final);
489c9b5090e2 Initial load duke parents: diff changeset	1576	phase->C->set_major_progress();
489c9b5090e2 Initial load duke parents: diff changeset	1577	return true;
489c9b5090e2 Initial load duke parents: diff changeset	1578	}
489c9b5090e2 Initial load duke parents: diff changeset	1579
489c9b5090e2 Initial load duke parents: diff changeset	1580
489c9b5090e2 Initial load duke parents: diff changeset	1581	//=============================================================================
489c9b5090e2 Initial load duke parents: diff changeset	1582	//------------------------------iteration_split_impl---------------------------
489c9b5090e2 Initial load duke parents: diff changeset	1583	void IdealLoopTree::iteration_split_impl( PhaseIdealLoop *phase, Node_List &old_new ) {
489c9b5090e2 Initial load duke parents: diff changeset	1584	// Check and remove empty loops (spam micro-benchmarks)
489c9b5090e2 Initial load duke parents: diff changeset	1585	if( policy_do_remove_empty_loop(phase) )
489c9b5090e2 Initial load duke parents: diff changeset	1586	return; // Here we removed an empty loop
489c9b5090e2 Initial load duke parents: diff changeset	1587
489c9b5090e2 Initial load duke parents: diff changeset	1588	bool should_peel = policy_peeling(phase); // Should we peel?
489c9b5090e2 Initial load duke parents: diff changeset	1589
489c9b5090e2 Initial load duke parents: diff changeset	1590	bool should_unswitch = policy_unswitching(phase);
489c9b5090e2 Initial load duke parents: diff changeset	1591
489c9b5090e2 Initial load duke parents: diff changeset	1592	// Non-counted loops may be peeled; exactly 1 iteration is peeled.
489c9b5090e2 Initial load duke parents: diff changeset	1593	// This removes loop-invariant tests (usually null checks).
489c9b5090e2 Initial load duke parents: diff changeset	1594	if( !_head->is_CountedLoop() ) { // Non-counted loop
489c9b5090e2 Initial load duke parents: diff changeset	1595	if (PartialPeelLoop && phase->partial_peel(this, old_new)) {
489c9b5090e2 Initial load duke parents: diff changeset	1596	return;
489c9b5090e2 Initial load duke parents: diff changeset	1597	}
489c9b5090e2 Initial load duke parents: diff changeset	1598	if( should_peel ) { // Should we peel?
489c9b5090e2 Initial load duke parents: diff changeset	1599	#ifndef PRODUCT
489c9b5090e2 Initial load duke parents: diff changeset	1600	if (PrintOpto) tty->print_cr("should_peel");
489c9b5090e2 Initial load duke parents: diff changeset	1601	#endif
489c9b5090e2 Initial load duke parents: diff changeset	1602	phase->do_peeling(this,old_new);
489c9b5090e2 Initial load duke parents: diff changeset	1603	} else if( should_unswitch ) {
489c9b5090e2 Initial load duke parents: diff changeset	1604	phase->do_unswitching(this, old_new);
489c9b5090e2 Initial load duke parents: diff changeset	1605	}
489c9b5090e2 Initial load duke parents: diff changeset	1606	return;
489c9b5090e2 Initial load duke parents: diff changeset	1607	}
489c9b5090e2 Initial load duke parents: diff changeset	1608	CountedLoopNode *cl = _head->as_CountedLoop();
489c9b5090e2 Initial load duke parents: diff changeset	1609
489c9b5090e2 Initial load duke parents: diff changeset	1610	if( !cl->loopexit() ) return; // Ignore various kinds of broken loops
489c9b5090e2 Initial load duke parents: diff changeset	1611
489c9b5090e2 Initial load duke parents: diff changeset	1612	// Do nothing special to pre- and post- loops
489c9b5090e2 Initial load duke parents: diff changeset	1613	if( cl->is_pre_loop() \|\| cl->is_post_loop() ) return;
489c9b5090e2 Initial load duke parents: diff changeset	1614
489c9b5090e2 Initial load duke parents: diff changeset	1615	// Compute loop trip count from profile data
489c9b5090e2 Initial load duke parents: diff changeset	1616	compute_profile_trip_cnt(phase);
489c9b5090e2 Initial load duke parents: diff changeset	1617
489c9b5090e2 Initial load duke parents: diff changeset	1618	// Before attempting fancy unrolling, RCE or alignment, see if we want
489c9b5090e2 Initial load duke parents: diff changeset	1619	// to completely unroll this loop or do loop unswitching.
489c9b5090e2 Initial load duke parents: diff changeset	1620	if( cl->is_normal_loop() ) {
489c9b5090e2 Initial load duke parents: diff changeset	1621	bool should_maximally_unroll = policy_maximally_unroll(phase);
489c9b5090e2 Initial load duke parents: diff changeset	1622	if( should_maximally_unroll ) {
489c9b5090e2 Initial load duke parents: diff changeset	1623	// Here we did some unrolling and peeling. Eventually we will
489c9b5090e2 Initial load duke parents: diff changeset	1624	// completely unroll this loop and it will no longer be a loop.
489c9b5090e2 Initial load duke parents: diff changeset	1625	phase->do_maximally_unroll(this,old_new);
489c9b5090e2 Initial load duke parents: diff changeset	1626	return;
489c9b5090e2 Initial load duke parents: diff changeset	1627	}
489c9b5090e2 Initial load duke parents: diff changeset	1628	if (should_unswitch) {
489c9b5090e2 Initial load duke parents: diff changeset	1629	phase->do_unswitching(this, old_new);
489c9b5090e2 Initial load duke parents: diff changeset	1630	return;
489c9b5090e2 Initial load duke parents: diff changeset	1631	}
489c9b5090e2 Initial load duke parents: diff changeset	1632	}
489c9b5090e2 Initial load duke parents: diff changeset	1633
489c9b5090e2 Initial load duke parents: diff changeset	1634
489c9b5090e2 Initial load duke parents: diff changeset	1635	// Counted loops may be peeled, may need some iterations run up
489c9b5090e2 Initial load duke parents: diff changeset	1636	// front for RCE, and may want to align loop refs to a cache
489c9b5090e2 Initial load duke parents: diff changeset	1637	// line. Thus we clone a full loop up front whose trip count is
489c9b5090e2 Initial load duke parents: diff changeset	1638	// at least 1 (if peeling), but may be several more.
489c9b5090e2 Initial load duke parents: diff changeset	1639
489c9b5090e2 Initial load duke parents: diff changeset	1640	// The main loop will start cache-line aligned with at least 1
489c9b5090e2 Initial load duke parents: diff changeset	1641	// iteration of the unrolled body (zero-trip test required) and
489c9b5090e2 Initial load duke parents: diff changeset	1642	// will have some range checks removed.
489c9b5090e2 Initial load duke parents: diff changeset	1643
489c9b5090e2 Initial load duke parents: diff changeset	1644	// A post-loop will finish any odd iterations (leftover after
489c9b5090e2 Initial load duke parents: diff changeset	1645	// unrolling), plus any needed for RCE purposes.
489c9b5090e2 Initial load duke parents: diff changeset	1646
489c9b5090e2 Initial load duke parents: diff changeset	1647	bool should_unroll = policy_unroll(phase);
489c9b5090e2 Initial load duke parents: diff changeset	1648
489c9b5090e2 Initial load duke parents: diff changeset	1649	bool should_rce = policy_range_check(phase);
489c9b5090e2 Initial load duke parents: diff changeset	1650
489c9b5090e2 Initial load duke parents: diff changeset	1651	bool should_align = policy_align(phase);
489c9b5090e2 Initial load duke parents: diff changeset	1652
489c9b5090e2 Initial load duke parents: diff changeset	1653	// If not RCE'ing (iteration splitting) or Aligning, then we do not
489c9b5090e2 Initial load duke parents: diff changeset	1654	// need a pre-loop. We may still need to peel an initial iteration but
489c9b5090e2 Initial load duke parents: diff changeset	1655	// we will not be needing an unknown number of pre-iterations.
489c9b5090e2 Initial load duke parents: diff changeset	1656	//
489c9b5090e2 Initial load duke parents: diff changeset	1657	// Basically, if may_rce_align reports FALSE first time through,
489c9b5090e2 Initial load duke parents: diff changeset	1658	// we will not be able to later do RCE or Aligning on this loop.
489c9b5090e2 Initial load duke parents: diff changeset	1659	bool may_rce_align = !policy_peel_only(phase) \|\| should_rce \|\| should_align;
489c9b5090e2 Initial load duke parents: diff changeset	1660
489c9b5090e2 Initial load duke parents: diff changeset	1661	// If we have any of these conditions (RCE, alignment, unrolling) met, then
489c9b5090e2 Initial load duke parents: diff changeset	1662	// we switch to the pre-/main-/post-loop model. This model also covers
489c9b5090e2 Initial load duke parents: diff changeset	1663	// peeling.
489c9b5090e2 Initial load duke parents: diff changeset	1664	if( should_rce \|\| should_align \|\| should_unroll ) {
489c9b5090e2 Initial load duke parents: diff changeset	1665	if( cl->is_normal_loop() ) // Convert to 'pre/main/post' loops
489c9b5090e2 Initial load duke parents: diff changeset	1666	phase->insert_pre_post_loops(this,old_new, !may_rce_align);
489c9b5090e2 Initial load duke parents: diff changeset	1667
489c9b5090e2 Initial load duke parents: diff changeset	1668	// Adjust the pre- and main-loop limits to let the pre and post loops run
489c9b5090e2 Initial load duke parents: diff changeset	1669	// with full checks, but the main-loop with no checks. Remove said
489c9b5090e2 Initial load duke parents: diff changeset	1670	// checks from the main body.
489c9b5090e2 Initial load duke parents: diff changeset	1671	if( should_rce )
489c9b5090e2 Initial load duke parents: diff changeset	1672	phase->do_range_check(this,old_new);
489c9b5090e2 Initial load duke parents: diff changeset	1673
489c9b5090e2 Initial load duke parents: diff changeset	1674	// Double loop body for unrolling. Adjust the minimum-trip test (will do
489c9b5090e2 Initial load duke parents: diff changeset	1675	// twice as many iterations as before) and the main body limit (only do
489c9b5090e2 Initial load duke parents: diff changeset	1676	// an even number of trips). If we are peeling, we might enable some RCE
489c9b5090e2 Initial load duke parents: diff changeset	1677	// and we'd rather unroll the post-RCE'd loop SO... do not unroll if
489c9b5090e2 Initial load duke parents: diff changeset	1678	// peeling.
489c9b5090e2 Initial load duke parents: diff changeset	1679	if( should_unroll && !should_peel )
489c9b5090e2 Initial load duke parents: diff changeset	1680	phase->do_unroll(this,old_new, true);
489c9b5090e2 Initial load duke parents: diff changeset	1681
489c9b5090e2 Initial load duke parents: diff changeset	1682	// Adjust the pre-loop limits to align the main body
489c9b5090e2 Initial load duke parents: diff changeset	1683	// iterations.
489c9b5090e2 Initial load duke parents: diff changeset	1684	if( should_align )
489c9b5090e2 Initial load duke parents: diff changeset	1685	Unimplemented();
489c9b5090e2 Initial load duke parents: diff changeset	1686
489c9b5090e2 Initial load duke parents: diff changeset	1687	} else { // Else we have an unchanged counted loop
489c9b5090e2 Initial load duke parents: diff changeset	1688	if( should_peel ) // Might want to peel but do nothing else
489c9b5090e2 Initial load duke parents: diff changeset	1689	phase->do_peeling(this,old_new);
489c9b5090e2 Initial load duke parents: diff changeset	1690	}
489c9b5090e2 Initial load duke parents: diff changeset	1691	}
489c9b5090e2 Initial load duke parents: diff changeset	1692
489c9b5090e2 Initial load duke parents: diff changeset	1693
489c9b5090e2 Initial load duke parents: diff changeset	1694	//=============================================================================
489c9b5090e2 Initial load duke parents: diff changeset	1695	//------------------------------iteration_split--------------------------------
489c9b5090e2 Initial load duke parents: diff changeset	1696	void IdealLoopTree::iteration_split( PhaseIdealLoop *phase, Node_List &old_new ) {
489c9b5090e2 Initial load duke parents: diff changeset	1697	// Recursively iteration split nested loops
489c9b5090e2 Initial load duke parents: diff changeset	1698	if( _child ) _child->iteration_split( phase, old_new );
489c9b5090e2 Initial load duke parents: diff changeset	1699
489c9b5090e2 Initial load duke parents: diff changeset	1700	// Clean out prior deadwood
489c9b5090e2 Initial load duke parents: diff changeset	1701	DCE_loop_body();
489c9b5090e2 Initial load duke parents: diff changeset	1702
489c9b5090e2 Initial load duke parents: diff changeset	1703
489c9b5090e2 Initial load duke parents: diff changeset	1704	// Look for loop-exit tests with my 50/50 guesses from the Parsing stage.
489c9b5090e2 Initial load duke parents: diff changeset	1705	// Replace with a 1-in-10 exit guess.
489c9b5090e2 Initial load duke parents: diff changeset	1706	if( _parent /not the root loop/ &&
489c9b5090e2 Initial load duke parents: diff changeset	1707	!_irreducible &&
489c9b5090e2 Initial load duke parents: diff changeset	1708	// Also ignore the occasional dead backedge
489c9b5090e2 Initial load duke parents: diff changeset	1709	!tail()->is_top() ) {
489c9b5090e2 Initial load duke parents: diff changeset	1710	adjust_loop_exit_prob(phase);
489c9b5090e2 Initial load duke parents: diff changeset	1711	}
489c9b5090e2 Initial load duke parents: diff changeset	1712
489c9b5090e2 Initial load duke parents: diff changeset	1713
489c9b5090e2 Initial load duke parents: diff changeset	1714	// Gate unrolling, RCE and peeling efforts.
489c9b5090e2 Initial load duke parents: diff changeset	1715	if( !_child && // If not an inner loop, do not split
489c9b5090e2 Initial load duke parents: diff changeset	1716	!_irreducible &&
489c9b5090e2 Initial load duke parents: diff changeset	1717	!tail()->is_top() ) { // Also ignore the occasional dead backedge
489c9b5090e2 Initial load duke parents: diff changeset	1718	if (!_has_call) {
489c9b5090e2 Initial load duke parents: diff changeset	1719	iteration_split_impl( phase, old_new );
489c9b5090e2 Initial load duke parents: diff changeset	1720	} else if (policy_unswitching(phase)) {
489c9b5090e2 Initial load duke parents: diff changeset	1721	phase->do_unswitching(this, old_new);
489c9b5090e2 Initial load duke parents: diff changeset	1722	}
489c9b5090e2 Initial load duke parents: diff changeset	1723	}
489c9b5090e2 Initial load duke parents: diff changeset	1724
489c9b5090e2 Initial load duke parents: diff changeset	1725	// Minor offset re-organization to remove loop-fallout uses of
489c9b5090e2 Initial load duke parents: diff changeset	1726	// trip counter.
489c9b5090e2 Initial load duke parents: diff changeset	1727	if( _head->is_CountedLoop() ) phase->reorg_offsets( this );
489c9b5090e2 Initial load duke parents: diff changeset	1728	if( _next ) _next->iteration_split( phase, old_new );
489c9b5090e2 Initial load duke parents: diff changeset	1729	}

author	duke
	Sat, 01 Dec 2007 00:00:00 +0000
changeset 1	489c9b5090e2
child 212	cd4963e67949
permissions	-rw-r--r--