author | roland |
Fri, 13 Jul 2018 15:44:54 +0200 | |
changeset 51085 | ad9d95f1a1f6 |
parent 51078 | fc6cfe40e32a |
child 51333 | f6641fcf7b7e |
permissions | -rw-r--r-- |
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
1 |
/* |
50180 | 2 |
* Copyright (c) 2016, 2018, Oracle and/or its affiliates. All rights reserved. |
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
3 |
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
4 |
* |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
5 |
* This code is free software; you can redistribute it and/or modify it |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
6 |
* under the terms of the GNU General Public License version 2 only, as |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
7 |
* published by the Free Software Foundation. |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
8 |
* |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
9 |
* This code is distributed in the hope that it will be useful, but WITHOUT |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
10 |
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
11 |
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
12 |
* version 2 for more details (a copy is included in the LICENSE file that |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
13 |
* accompanied this code). |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
14 |
* |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
15 |
* You should have received a copy of the GNU General Public License version |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
16 |
* 2 along with this work; if not, write to the Free Software Foundation, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
17 |
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
18 |
* |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
19 |
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
20 |
* or visit www.oracle.com if you need additional information or have any |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
21 |
* questions. |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
22 |
* |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
23 |
*/ |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
24 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
25 |
#include "precompiled.hpp" |
50180 | 26 |
#include "gc/shared/barrierSet.hpp" |
27 |
#include "gc/shared/c2/barrierSetC2.hpp" |
|
28 |
#include "gc/shared/c2/cardTableBarrierSetC2.hpp" |
|
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
29 |
#include "opto/arraycopynode.hpp" |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
30 |
#include "opto/graphKit.hpp" |
45427
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
31 |
#include "runtime/sharedRuntime.hpp" |
50180 | 32 |
#include "utilities/macros.hpp" |
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
33 |
|
42086
feac795f345d
8159611: C2: ArrayCopy elimination skips required parameter checks
simonis
parents:
40365
diff
changeset
|
34 |
// Constructs an array copy node as a CallNode built from arraycopy_type(),
// a NULL second argument and TypeRawPtr::BOTTOM.
//
// The two flags are recorded as given. The node starts out with kind None,
// with its arguments marked as not validated, and with TypeOopPtr::BOTTOM
// as both the source and the destination type.
//
// The node is tagged with Class_ArrayCopy and Flag_is_macro and is
// registered with the compilation C through add_macro_node().
ArrayCopyNode::ArrayCopyNode(Compile* C, bool alloc_tightly_coupled, bool has_negative_length_guard)
  : CallNode(arraycopy_type(), NULL, TypeRawPtr::BOTTOM),
    _alloc_tightly_coupled(alloc_tightly_coupled),
    _has_negative_length_guard(has_negative_length_guard),
    _kind(None),
    _arguments_validated(false),
    _src_type(TypeOopPtr::BOTTOM),
    _dest_type(TypeOopPtr::BOTTOM)
{
  init_class_id(Class_ArrayCopy);
  init_flags(Flag_is_macro);
  C->add_macro_node(this);
}
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
46 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
47 |
// Reports the size in bytes of this node object.
uint ArrayCopyNode::size_of() const {
  return sizeof(*this);
}
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
48 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
49 |
// Allocates a new ArrayCopyNode and fills in its inputs.
//
// The kit first sets the predefined runtime-call inputs of the node, then
// the copy-specific inputs (source, destination, positions, length, array
// lengths and klasses) are installed from the arguments.
//
// If may_throw is true the node additionally receives the kit's current
// I/O state and safepoint edges.
//
// alloc_tightly_coupled and has_negative_length_guard are forwarded to the
// ArrayCopyNode constructor unchanged.
//
// Returns the new node. This function does not call connect_outputs().
ArrayCopyNode* ArrayCopyNode::make(GraphKit* kit, bool may_throw,
                                   Node* src, Node* src_offset,
                                   Node* dest, Node* dest_offset,
                                   Node* length,
                                   bool alloc_tightly_coupled,
                                   bool has_negative_length_guard,
                                   Node* src_klass, Node* dest_klass,
                                   Node* src_length, Node* dest_length) {

  ArrayCopyNode* ac = new ArrayCopyNode(kit->C, alloc_tightly_coupled, has_negative_length_guard);
  // Only the effect of this call on 'ac' is needed here; the value it
  // returns is not used by this function.
  kit->set_predefined_input_for_runtime_call(ac);

  ac->init_req(ArrayCopyNode::Src, src);
  ac->init_req(ArrayCopyNode::SrcPos, src_offset);
  ac->init_req(ArrayCopyNode::Dest, dest);
  ac->init_req(ArrayCopyNode::DestPos, dest_offset);
  ac->init_req(ArrayCopyNode::Length, length);
  ac->init_req(ArrayCopyNode::SrcLen, src_length);
  ac->init_req(ArrayCopyNode::DestLen, dest_length);
  ac->init_req(ArrayCopyNode::SrcKlass, src_klass);
  ac->init_req(ArrayCopyNode::DestKlass, dest_klass);

  if (may_throw) {
    ac->set_req(TypeFunc::I_O , kit->i_o());
    kit->add_safepoint_edges(ac, false);
  }

  return ac;
}
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
78 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
79 |
// Hooks the outputs of this node into the state of the given kit.
//
// In order: set_all_memory_call(this, true), new Control and I_O
// projections of this node become the kit's control and i_o,
// make_slow_call_ex() is invoked with Throwable as the exception klass,
// and finally set_all_memory_call(this) is called again without the
// second argument.
void ArrayCopyNode::connect_outputs(GraphKit* kit) {
  kit->set_all_memory_call(this, true);

  Node* ctl_proj = kit->gvn().transform(new ProjNode(this, TypeFunc::Control));
  kit->set_control(ctl_proj);

  Node* io_proj = kit->gvn().transform(new ProjNode(this, TypeFunc::I_O));
  kit->set_i_o(io_proj);

  kit->make_slow_call_ex(this, kit->env()->Throwable_klass(), true);
  kit->set_all_memory_call(this);
}
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
86 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
87 |
#ifndef PRODUCT |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
88 |
// Printable names used when dumping a node; the table is indexed by _kind.
const char* ArrayCopyNode::_kind_names[] = {
  "arraycopy",
  "arraycopy, validated arguments",
  "clone",
  "oop array clone",
  "CopyOf",
  "CopyOfRange"
};
32084
7743e6943cdf
8004073: Implement C2 Ideal node specific dump() method
mhaupt
parents:
31233
diff
changeset
|
89 |
|
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
90 |
// Prints the CallNode specifics followed by the name of this copy's kind
// in parentheses, with an extra note when _alloc_tightly_coupled is set.
void ArrayCopyNode::dump_spec(outputStream *st) const {
  CallNode::dump_spec(st);

  const char* kind_name = _kind_names[_kind];
  const char* coupling = _alloc_tightly_coupled ? ", tightly coupled allocation" : "";
  st->print(" (%s%s)", kind_name, coupling);
}
32084
7743e6943cdf
8004073: Implement C2 Ideal node specific dump() method
mhaupt
parents:
31233
diff
changeset
|
94 |
|
7743e6943cdf
8004073: Implement C2 Ideal node specific dump() method
mhaupt
parents:
31233
diff
changeset
|
95 |
// Short form of the dump: the kind name, followed by ",tight" when
// _alloc_tightly_coupled is set.
void ArrayCopyNode::dump_compact_spec(outputStream* st) const {
  const char* kind_name = _kind_names[_kind];
  const char* coupling = _alloc_tightly_coupled ? ",tight" : "";
  st->print("%s%s", kind_name, coupling);
}
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
98 |
#endif |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
99 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
100 |
// Queries the Length input of this node for a constant value.
//
// Returns -1 when the type of the length is TOP. Otherwise the result
// comes from find_intptr_t_con() for a basic clone and from find_int_con()
// for the other kinds; both are called with -1 as their argument.
intptr_t ArrayCopyNode::get_length_if_constant(PhaseGVN *phase) const {
  Node* len = in(ArrayCopyNode::Length);
  const Type* len_type = phase->type(len);

  if (len_type == Type::TOP) {
    return -1;
  }

  assert(is_clonebasic() || is_arraycopy() || is_copyof() || is_copyofrange(), "unexpected array copy type");

  if (is_clonebasic()) {
    return len->find_intptr_t_con(-1);
  }
  return len->find_int_con(-1);
}
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
113 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
114 |
// Computes how many items this copy moves, or -1 when that is not known.
//
// - Not a basic clone: the result of get_length_if_constant().
// - Basic clone of an instance: the number of non-static fields of the
//   source klass, or -1 when the klass is not exact and is an interface or
//   has a subklass, or when it has injected fields.
// - Basic clone of an array: the constant size of the source array type,
//   or -1 when that size is not a constant.
int ArrayCopyNode::get_count(PhaseGVN *phase) const {
  Node* source = in(ArrayCopyNode::Src);
  const Type* source_type = phase->type(source);

  if (!is_clonebasic()) {
    return get_length_if_constant(phase);
  }

  if (source_type->isa_instptr()) {
    const TypeInstPtr* inst = source_type->is_instptr();
    ciInstanceKlass* klass = inst->klass()->as_instance_klass();
    // nof_nonstatic_fields() does not account for injected fields. Those
    // are rare, so instances that have them are simply not handled.
    const bool may_have_subtypes =
      !inst->klass_is_exact() && (klass->is_interface() || klass->has_subklass());
    if (may_have_subtypes || klass->has_injected_fields()) {
      return -1;
    }
    return klass->nof_nonstatic_fields();
  }

  const TypeAryPtr* ary = source_type->isa_aryptr();
  assert (ary != NULL, "not an array or instance?");
  // For a clone the length input is a rounded number of longs, while an
  // array is cloned element by element. A constant length input implies
  // that the length of the source array is constant as well.

  assert((get_length_if_constant(phase) == -1) == !ary->size()->is_con() ||
         phase->is_IterGVN(), "inconsistent");

  return ary->size()->is_con() ? ary->size()->get_con() : -1;
}
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
150 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
151 |
Node* ArrayCopyNode::try_clone_instance(PhaseGVN *phase, bool can_reshape, int count) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
152 |
if (!is_clonebasic()) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
153 |
return NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
154 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
155 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
156 |
Node* src = in(ArrayCopyNode::Src); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
157 |
Node* dest = in(ArrayCopyNode::Dest); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
158 |
Node* ctl = in(TypeFunc::Control); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
159 |
Node* in_mem = in(TypeFunc::Memory); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
160 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
161 |
const Type* src_type = phase->type(src); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
162 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
163 |
assert(src->is_AddP(), "should be base + off"); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
164 |
assert(dest->is_AddP(), "should be base + off"); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
165 |
Node* base_src = src->in(AddPNode::Base); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
166 |
Node* base_dest = dest->in(AddPNode::Base); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
167 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
168 |
MergeMemNode* mem = MergeMemNode::make(in_mem); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
169 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
170 |
const TypeInstPtr* inst_src = src_type->isa_instptr(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
171 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
172 |
if (inst_src == NULL) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
173 |
return NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
174 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
175 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
176 |
if (!inst_src->klass_is_exact()) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
177 |
ciInstanceKlass* ik = inst_src->klass()->as_instance_klass(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
178 |
assert(!ik->is_interface() && !ik->has_subklass(), "inconsistent klass hierarchy"); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
179 |
phase->C->dependencies()->assert_leaf_type(ik); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
180 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
181 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
182 |
ciInstanceKlass* ik = inst_src->klass()->as_instance_klass(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
183 |
assert(ik->nof_nonstatic_fields() <= ArrayCopyLoadStoreMaxElem, "too many fields"); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
184 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
185 |
for (int i = 0; i < count; i++) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
186 |
ciField* field = ik->nonstatic_field_at(i); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
187 |
int fieldidx = phase->C->alias_type(field)->index(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
188 |
const TypePtr* adr_type = phase->C->alias_type(field)->adr_type(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
189 |
Node* off = phase->MakeConX(field->offset()); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
190 |
Node* next_src = phase->transform(new AddPNode(base_src,base_src,off)); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
191 |
Node* next_dest = phase->transform(new AddPNode(base_dest,base_dest,off)); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
192 |
BasicType bt = field->layout_type(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
193 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
194 |
const Type *type; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
195 |
if (bt == T_OBJECT) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
196 |
if (!field->type()->is_loaded()) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
197 |
type = TypeInstPtr::BOTTOM; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
198 |
} else { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
199 |
ciType* field_klass = field->type(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
200 |
type = TypeOopPtr::make_from_klass(field_klass->as_klass()); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
201 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
202 |
} else { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
203 |
type = Type::get_const_basic_type(bt); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
204 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
205 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
206 |
Node* v = LoadNode::make(*phase, ctl, mem->memory_at(fieldidx), next_src, adr_type, type, bt, MemNode::unordered); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
207 |
v = phase->transform(v); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
208 |
Node* s = StoreNode::make(*phase, ctl, mem->memory_at(fieldidx), next_dest, adr_type, v, bt, MemNode::unordered); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
209 |
s = phase->transform(s); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
210 |
mem->set_memory_at(fieldidx, s); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
211 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
212 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
213 |
if (!finish_transform(phase, can_reshape, ctl, mem)) { |
39254
fb4492288b01
8156760: VM crashes if -XX:-ReduceInitialCardMarks is set
thartmann
parents:
32576
diff
changeset
|
214 |
// Return NodeSentinel to indicate that the transform failed |
fb4492288b01
8156760: VM crashes if -XX:-ReduceInitialCardMarks is set
thartmann
parents:
32576
diff
changeset
|
215 |
return NodeSentinel; |
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
216 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
217 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
218 |
return mem; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
219 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
220 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
221 |
bool ArrayCopyNode::prepare_array_copy(PhaseGVN *phase, bool can_reshape, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
222 |
Node*& adr_src, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
223 |
Node*& base_src, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
224 |
Node*& adr_dest, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
225 |
Node*& base_dest, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
226 |
BasicType& copy_type, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
227 |
const Type*& value_type, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
228 |
bool& disjoint_bases) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
229 |
Node* src = in(ArrayCopyNode::Src); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
230 |
Node* dest = in(ArrayCopyNode::Dest); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
231 |
const Type* src_type = phase->type(src); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
232 |
const TypeAryPtr* ary_src = src_type->isa_aryptr(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
233 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
234 |
if (is_arraycopy() || is_copyofrange() || is_copyof()) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
235 |
const Type* dest_type = phase->type(dest); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
236 |
const TypeAryPtr* ary_dest = dest_type->isa_aryptr(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
237 |
Node* src_offset = in(ArrayCopyNode::SrcPos); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
238 |
Node* dest_offset = in(ArrayCopyNode::DestPos); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
239 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
240 |
// newly allocated object is guaranteed to not overlap with source object |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
241 |
disjoint_bases = is_alloc_tightly_coupled(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
242 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
243 |
if (ary_src == NULL || ary_src->klass() == NULL || |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
244 |
ary_dest == NULL || ary_dest->klass() == NULL) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
245 |
// We don't know if arguments are arrays |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
246 |
return false; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
247 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
248 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
249 |
BasicType src_elem = ary_src->klass()->as_array_klass()->element_type()->basic_type(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
250 |
BasicType dest_elem = ary_dest->klass()->as_array_klass()->element_type()->basic_type(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
251 |
if (src_elem == T_ARRAY) src_elem = T_OBJECT; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
252 |
if (dest_elem == T_ARRAY) dest_elem = T_OBJECT; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
253 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
254 |
if (src_elem != dest_elem || dest_elem == T_VOID) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
255 |
// We don't know if arguments are arrays of the same type |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
256 |
return false; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
257 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
258 |
|
50180 | 259 |
BarrierSetC2* bs = BarrierSet::barrier_set()->barrier_set_c2(); |
260 |
if (dest_elem == T_OBJECT && (!is_alloc_tightly_coupled() || |
|
261 |
bs->array_copy_requires_gc_barriers(T_OBJECT))) { |
|
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
262 |
// It's an object array copy but we can't emit the card marking |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
263 |
// that is needed |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
264 |
return false; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
265 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
266 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
267 |
value_type = ary_src->elem(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
268 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
269 |
base_src = src; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
270 |
base_dest = dest; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
271 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
272 |
uint shift = exact_log2(type2aelembytes(dest_elem)); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
273 |
uint header = arrayOopDesc::base_offset_in_bytes(dest_elem); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
274 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
275 |
adr_src = src; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
276 |
adr_dest = dest; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
277 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
278 |
src_offset = Compile::conv_I2X_index(phase, src_offset, ary_src->size()); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
279 |
dest_offset = Compile::conv_I2X_index(phase, dest_offset, ary_dest->size()); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
280 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
281 |
Node* src_scale = phase->transform(new LShiftXNode(src_offset, phase->intcon(shift))); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
282 |
Node* dest_scale = phase->transform(new LShiftXNode(dest_offset, phase->intcon(shift))); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
283 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
284 |
adr_src = phase->transform(new AddPNode(base_src, adr_src, src_scale)); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
285 |
adr_dest = phase->transform(new AddPNode(base_dest, adr_dest, dest_scale)); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
286 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
287 |
adr_src = new AddPNode(base_src, adr_src, phase->MakeConX(header)); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
288 |
adr_dest = new AddPNode(base_dest, adr_dest, phase->MakeConX(header)); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
289 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
290 |
adr_src = phase->transform(adr_src); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
291 |
adr_dest = phase->transform(adr_dest); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
292 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
293 |
copy_type = dest_elem; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
294 |
} else { |
44322
051426f34a5e
8176505: Wrong assertion 'should be an array copy/clone' in arraycopynode.cpp
simonis
parents:
42086
diff
changeset
|
295 |
assert(ary_src != NULL, "should be a clone"); |
051426f34a5e
8176505: Wrong assertion 'should be an array copy/clone' in arraycopynode.cpp
simonis
parents:
42086
diff
changeset
|
296 |
assert(is_clonebasic(), "should be"); |
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
297 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
298 |
disjoint_bases = true; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
299 |
assert(src->is_AddP(), "should be base + off"); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
300 |
assert(dest->is_AddP(), "should be base + off"); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
301 |
adr_src = src; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
302 |
base_src = src->in(AddPNode::Base); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
303 |
adr_dest = dest; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
304 |
base_dest = dest->in(AddPNode::Base); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
305 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
306 |
assert(phase->type(src->in(AddPNode::Offset))->is_intptr_t()->get_con() == phase->type(dest->in(AddPNode::Offset))->is_intptr_t()->get_con(), "same start offset?"); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
307 |
BasicType elem = ary_src->klass()->as_array_klass()->element_type()->basic_type(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
308 |
if (elem == T_ARRAY) elem = T_OBJECT; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
309 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
310 |
int diff = arrayOopDesc::base_offset_in_bytes(elem) - phase->type(src->in(AddPNode::Offset))->is_intptr_t()->get_con(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
311 |
assert(diff >= 0, "clone should not start after 1st array element"); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
312 |
if (diff > 0) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
313 |
adr_src = phase->transform(new AddPNode(base_src, adr_src, phase->MakeConX(diff))); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
314 |
adr_dest = phase->transform(new AddPNode(base_dest, adr_dest, phase->MakeConX(diff))); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
315 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
316 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
317 |
copy_type = elem; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
318 |
value_type = ary_src->elem(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
319 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
320 |
return true; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
321 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
322 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
323 |
// Returns the pointer type of node n with its offset replaced by
// Type::OffsetBot, i.e. the address type used for the array elements
// reachable through n.
const TypePtr* ArrayCopyNode::get_address_type(PhaseGVN *phase, Node* n) {
  const Type* node_type = phase->type(n);
  assert(node_type != Type::TOP, "unexpected type");
  const TypePtr* ptr_type = node_type->isa_ptr();
  // adjust the pointer type to be the correct array element address type
  return ptr_type->add_offset(Type::OffsetBot);
}
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
331 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
332 |
// Chooses the control path(s) for the element-wise copy.
//
// If the bases are known to be disjoint, or at most one element is copied,
// only forward_ctl is set (to this node's control input) and backward_ctl
// is left untouched. Otherwise a test "SrcPos < DestPos" is emitted:
// backward_ctl receives the true projection and forward_ctl the false one.
void ArrayCopyNode::array_copy_test_overlap(PhaseGVN *phase, bool can_reshape, bool disjoint_bases, int count, Node*& forward_ctl, Node*& backward_ctl) {
  Node* entry_ctl = in(TypeFunc::Control);

  const bool needs_direction_test = !disjoint_bases && count > 1;
  if (!needs_direction_test) {
    forward_ctl = entry_ctl;
    return;
  }

  Node* src_pos = in(ArrayCopyNode::SrcPos);
  Node* dest_pos = in(ArrayCopyNode::DestPos);
  assert(src_pos != NULL && dest_pos != NULL, "should be");

  Node* pos_cmp = phase->transform(new CmpINode(src_pos, dest_pos));
  Node* src_before_dest = phase->transform(new BoolNode(pos_cmp, BoolTest::lt));
  IfNode* direction_if = new IfNode(entry_ctl, src_before_dest, PROB_FAIR, COUNT_UNKNOWN);

  phase->transform(direction_if);

  forward_ctl = phase->transform(new IfFalseNode(direction_if));
  backward_ctl = phase->transform(new IfTrueNode(direction_if));
}
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
350 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
351 |
// Emits the load/store pairs that copy `count` elements from lowest to
// highest address and returns the resulting destination memory state.
//
// Returns top if forward_ctl is top. If count is not positive no copy nodes
// are created and start_mem_dest is returned; in that case, when
// can_reshape is set, adr_src and adr_dest are pushed on the IGVN worklist.
Node* ArrayCopyNode::array_copy_forward(PhaseGVN *phase,
                                        bool can_reshape,
                                        Node* forward_ctl,
                                        Node* start_mem_src,
                                        Node* start_mem_dest,
                                        const TypePtr* atp_src,
                                        const TypePtr* atp_dest,
                                        Node* adr_src,
                                        Node* base_src,
                                        Node* adr_dest,
                                        Node* base_dest,
                                        BasicType copy_type,
                                        const Type* value_type,
                                        int count) {
  Node* cur_mem = phase->C->top();
  if (forward_ctl->is_top()) {
    return cur_mem;
  }

  // copy forward
  cur_mem = start_mem_dest;
  const uint src_alias = phase->C->get_alias_index(atp_src);
  const uint dest_alias = phase->C->get_alias_index(atp_dest);
  const bool shares_alias = (src_alias == dest_alias);

  if (count <= 0) {
    if (can_reshape) {
      PhaseIterGVN* igvn = phase->is_IterGVN();
      igvn->_worklist.push(adr_src);
      igvn->_worklist.push(adr_dest);
    }
    return cur_mem;
  }

  // First element: uses the start addresses and the initial source memory.
  Node* value = LoadNode::make(*phase, forward_ctl, start_mem_src, adr_src, atp_src, value_type, copy_type, MemNode::unordered);
  value = phase->transform(value);
  cur_mem = StoreNode::make(*phase, forward_ctl, cur_mem, adr_dest, atp_dest, value, copy_type, MemNode::unordered);
  cur_mem = phase->transform(cur_mem);

  // Remaining elements: when both sides share an alias class, each load
  // reads from the memory state left by the previous store.
  const int elem_bytes = type2aelembytes(copy_type);
  for (int idx = 1; idx < count; idx++) {
    Node* byte_off = phase->MakeConX(elem_bytes * idx);
    Node* elem_src = phase->transform(new AddPNode(base_src, adr_src, byte_off));
    Node* elem_dest = phase->transform(new AddPNode(base_dest, adr_dest, byte_off));
    Node* load_mem = shares_alias ? cur_mem : start_mem_src;
    value = LoadNode::make(*phase, forward_ctl, load_mem, elem_src, atp_src, value_type, copy_type, MemNode::unordered);
    value = phase->transform(value);
    cur_mem = StoreNode::make(*phase, forward_ctl, cur_mem, elem_dest, atp_dest, value, copy_type, MemNode::unordered);
    cur_mem = phase->transform(cur_mem);
  }
  return cur_mem;
}
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
395 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
396 |
// Expand a small array copy into explicit load/store pairs, walking the
// elements from index count-1 down to index 0.
//
// phase                         - GVN phase used to create and transform the new nodes
// can_reshape                   - when true and count is not positive, the address nodes
//                                 are pushed on the IGVN worklist
// backward_ctl                  - control for the emitted loads/stores; if it is top,
//                                 nothing is emitted
// start_mem_src/start_mem_dest  - initial memory states for the source and
//                                 destination slices
// atp_src/atp_dest              - address types of the source and destination
// adr_src/base_src              - address of source element 0 and its base
// adr_dest/base_dest            - address of destination element 0 and its base
// copy_type/value_type          - element basic type and the type of the loaded value
// count                         - number of elements to copy
//
// Returns top if backward_ctl is top, start_mem_dest if count is not
// positive, and otherwise the memory state produced by the last store.
Node* ArrayCopyNode::array_copy_backward(PhaseGVN *phase,
                                         bool can_reshape,
                                         Node* backward_ctl,
                                         Node* start_mem_src,
                                         Node* start_mem_dest,
                                         const TypePtr* atp_src,
                                         const TypePtr* atp_dest,
                                         Node* adr_src,
                                         Node* base_src,
                                         Node* adr_dest,
                                         Node* base_dest,
                                         BasicType copy_type,
                                         const Type* value_type,
                                         int count) {
  Node* mem = phase->C->top();
  if (backward_ctl->is_top()) {
    // No backward path: hand back top as the memory state.
    return mem;
  }

  // copy backward
  mem = start_mem_dest;
  const uint src_alias = phase->C->get_alias_index(atp_src);
  const uint dest_alias = phase->C->get_alias_index(atp_dest);
  // When source and destination share an alias index, every load has to
  // read from the running memory chain so that it observes the stores
  // emitted before it; otherwise loads read the initial source memory.
  const bool same_alias = (src_alias == dest_alias);

  if (count <= 0) {
    if (can_reshape) {
      // Nothing to copy: queue the address nodes on the IGVN worklist.
      // NOTE(review): presumably so the now unused address nodes get
      // revisited/cleaned up -- confirm.
      PhaseIterGVN* igvn = phase->is_IterGVN();
      igvn->_worklist.push(adr_src);
      igvn->_worklist.push(adr_dest);
    }
    return mem;
  }

  for (int idx = count - 1; idx >= 0; idx--) {
    // Element 0 uses the incoming addresses directly; every other element
    // gets an AddP with a constant byte offset.
    Node* elem_src = adr_src;
    Node* elem_dest = adr_dest;
    if (idx >= 1) {
      Node* byte_off = phase->MakeConX(type2aelembytes(copy_type) * idx);
      elem_src = phase->transform(new AddPNode(base_src, adr_src, byte_off));
      elem_dest = phase->transform(new AddPNode(base_dest, adr_dest, byte_off));
    }

    Node* load_mem = same_alias ? mem : start_mem_src;
    Node* val = LoadNode::make(*phase, backward_ctl, load_mem, elem_src, atp_src,
                               value_type, copy_type, MemNode::unordered);
    val = phase->transform(val);

    // Chain the store onto the current destination memory state.
    mem = StoreNode::make(*phase, backward_ctl, mem, elem_dest, atp_dest, val,
                          copy_type, MemNode::unordered);
    mem = phase->transform(mem);
  }
  return mem;
}
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
440 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
441 |
bool ArrayCopyNode::finish_transform(PhaseGVN *phase, bool can_reshape, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
442 |
Node* ctl, Node *mem) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
443 |
if (can_reshape) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
444 |
PhaseIterGVN* igvn = phase->is_IterGVN(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
445 |
igvn->set_delay_transform(false); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
446 |
if (is_clonebasic()) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
447 |
Node* out_mem = proj_out(TypeFunc::Memory); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
448 |
|
50180 | 449 |
BarrierSetC2* bs = BarrierSet::barrier_set()->barrier_set_c2(); |
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
450 |
if (out_mem->outcnt() != 1 || !out_mem->raw_out(0)->is_MergeMem() || |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
451 |
out_mem->raw_out(0)->outcnt() != 1 || !out_mem->raw_out(0)->raw_out(0)->is_MemBar()) { |
50180 | 452 |
assert(bs->array_copy_requires_gc_barriers(T_OBJECT), "can only happen with card marking"); |
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
453 |
return false; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
454 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
455 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
456 |
igvn->replace_node(out_mem->raw_out(0), mem); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
457 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
458 |
Node* out_ctl = proj_out(TypeFunc::Control); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
459 |
igvn->replace_node(out_ctl, ctl); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
460 |
} else { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
461 |
// replace fallthrough projections of the ArrayCopyNode by the |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
462 |
// new memory, control and the input IO. |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
463 |
CallProjections callprojs; |
31233
7033a9f3e2f1
8086016: closed/java/text/Format/NumberFormat/BigDecimalCompatibilityTest.java is crashing
roland
parents:
31044
diff
changeset
|
464 |
extract_projections(&callprojs, true, false); |
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
465 |
|
31233
7033a9f3e2f1
8086016: closed/java/text/Format/NumberFormat/BigDecimalCompatibilityTest.java is crashing
roland
parents:
31044
diff
changeset
|
466 |
if (callprojs.fallthrough_ioproj != NULL) { |
7033a9f3e2f1
8086016: closed/java/text/Format/NumberFormat/BigDecimalCompatibilityTest.java is crashing
roland
parents:
31044
diff
changeset
|
467 |
igvn->replace_node(callprojs.fallthrough_ioproj, in(TypeFunc::I_O)); |
7033a9f3e2f1
8086016: closed/java/text/Format/NumberFormat/BigDecimalCompatibilityTest.java is crashing
roland
parents:
31044
diff
changeset
|
468 |
} |
7033a9f3e2f1
8086016: closed/java/text/Format/NumberFormat/BigDecimalCompatibilityTest.java is crashing
roland
parents:
31044
diff
changeset
|
469 |
if (callprojs.fallthrough_memproj != NULL) { |
7033a9f3e2f1
8086016: closed/java/text/Format/NumberFormat/BigDecimalCompatibilityTest.java is crashing
roland
parents:
31044
diff
changeset
|
470 |
igvn->replace_node(callprojs.fallthrough_memproj, mem); |
7033a9f3e2f1
8086016: closed/java/text/Format/NumberFormat/BigDecimalCompatibilityTest.java is crashing
roland
parents:
31044
diff
changeset
|
471 |
} |
7033a9f3e2f1
8086016: closed/java/text/Format/NumberFormat/BigDecimalCompatibilityTest.java is crashing
roland
parents:
31044
diff
changeset
|
472 |
if (callprojs.fallthrough_catchproj != NULL) { |
7033a9f3e2f1
8086016: closed/java/text/Format/NumberFormat/BigDecimalCompatibilityTest.java is crashing
roland
parents:
31044
diff
changeset
|
473 |
igvn->replace_node(callprojs.fallthrough_catchproj, ctl); |
7033a9f3e2f1
8086016: closed/java/text/Format/NumberFormat/BigDecimalCompatibilityTest.java is crashing
roland
parents:
31044
diff
changeset
|
474 |
} |
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
475 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
476 |
// The ArrayCopyNode is not disconnected. It still has the |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
477 |
// projections for the exception case. Replace current |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
478 |
// ArrayCopyNode with a dummy new one with a top() control so |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
479 |
// that this part of the graph stays consistent but is |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
480 |
// eventually removed. |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
481 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
482 |
set_req(0, phase->C->top()); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
483 |
remove_dead_region(phase, can_reshape); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
484 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
485 |
} else { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
486 |
if (in(TypeFunc::Control) != ctl) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
487 |
// we can't return new memory and control from Ideal at parse time |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
488 |
assert(!is_clonebasic(), "added control for clone?"); |
29340
e5ee51840b93
8073624: Fix waring "converting to non-pointer type 'bool' from NULL" in arraycopynode.cpp
simonis
parents:
29337
diff
changeset
|
489 |
return false; |
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
490 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
491 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
492 |
return true; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
493 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
494 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
495 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
496 |
Node *ArrayCopyNode::Ideal(PhaseGVN *phase, bool can_reshape) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
497 |
if (remove_dead_region(phase, can_reshape)) return this; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
498 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
499 |
if (StressArrayCopyMacroNode && !can_reshape) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
500 |
phase->record_for_igvn(this); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
501 |
return NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
502 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
503 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
504 |
// See if it's a small array copy and we can inline it as |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
505 |
// loads/stores |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
506 |
// Here we can only do: |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
507 |
// - arraycopy if all arguments were validated before and we don't |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
508 |
// need card marking |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
509 |
// - clone for which we don't need to do card marking |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
510 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
511 |
if (!is_clonebasic() && !is_arraycopy_validated() && |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
512 |
!is_copyofrange_validated() && !is_copyof_validated()) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
513 |
return NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
514 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
515 |
|
29360
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
516 |
assert(in(TypeFunc::Control) != NULL && |
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
517 |
in(TypeFunc::Memory) != NULL && |
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
518 |
in(ArrayCopyNode::Src) != NULL && |
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
519 |
in(ArrayCopyNode::Dest) != NULL && |
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
520 |
in(ArrayCopyNode::Length) != NULL && |
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
521 |
((in(ArrayCopyNode::SrcPos) != NULL && in(ArrayCopyNode::DestPos) != NULL) || |
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
522 |
is_clonebasic()), "broken inputs"); |
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
523 |
|
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
524 |
if (in(TypeFunc::Control)->is_top() || |
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
525 |
in(TypeFunc::Memory)->is_top() || |
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
526 |
phase->type(in(ArrayCopyNode::Src)) == Type::TOP || |
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
527 |
phase->type(in(ArrayCopyNode::Dest)) == Type::TOP || |
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
528 |
(in(ArrayCopyNode::SrcPos) != NULL && in(ArrayCopyNode::SrcPos)->is_top()) || |
dd9daceb5f3d
8073957: assert(ary_src != 0) failed: not an array or instance?
roland
parents:
29345
diff
changeset
|
529 |
(in(ArrayCopyNode::DestPos) != NULL && in(ArrayCopyNode::DestPos)->is_top())) { |
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
530 |
return NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
531 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
532 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
533 |
int count = get_count(phase); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
534 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
535 |
if (count < 0 || count > ArrayCopyLoadStoreMaxElem) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
536 |
return NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
537 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
538 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
539 |
Node* mem = try_clone_instance(phase, can_reshape, count); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
540 |
if (mem != NULL) { |
39254
fb4492288b01
8156760: VM crashes if -XX:-ReduceInitialCardMarks is set
thartmann
parents:
32576
diff
changeset
|
541 |
return (mem == NodeSentinel) ? NULL : mem; |
29337
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
542 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
543 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
544 |
Node* adr_src = NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
545 |
Node* base_src = NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
546 |
Node* adr_dest = NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
547 |
Node* base_dest = NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
548 |
BasicType copy_type = T_ILLEGAL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
549 |
const Type* value_type = NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
550 |
bool disjoint_bases = false; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
551 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
552 |
if (!prepare_array_copy(phase, can_reshape, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
553 |
adr_src, base_src, adr_dest, base_dest, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
554 |
copy_type, value_type, disjoint_bases)) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
555 |
return NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
556 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
557 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
558 |
Node* src = in(ArrayCopyNode::Src); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
559 |
Node* dest = in(ArrayCopyNode::Dest); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
560 |
const TypePtr* atp_src = get_address_type(phase, src); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
561 |
const TypePtr* atp_dest = get_address_type(phase, dest); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
562 |
uint alias_idx_src = phase->C->get_alias_index(atp_src); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
563 |
uint alias_idx_dest = phase->C->get_alias_index(atp_dest); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
564 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
565 |
Node *in_mem = in(TypeFunc::Memory); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
566 |
Node *start_mem_src = in_mem; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
567 |
Node *start_mem_dest = in_mem; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
568 |
if (in_mem->is_MergeMem()) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
569 |
start_mem_src = in_mem->as_MergeMem()->memory_at(alias_idx_src); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
570 |
start_mem_dest = in_mem->as_MergeMem()->memory_at(alias_idx_dest); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
571 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
572 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
573 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
574 |
if (can_reshape) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
575 |
assert(!phase->is_IterGVN()->delay_transform(), "cannot delay transforms"); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
576 |
phase->is_IterGVN()->set_delay_transform(true); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
577 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
578 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
579 |
Node* backward_ctl = phase->C->top(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
580 |
Node* forward_ctl = phase->C->top(); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
581 |
array_copy_test_overlap(phase, can_reshape, disjoint_bases, count, forward_ctl, backward_ctl); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
582 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
583 |
Node* forward_mem = array_copy_forward(phase, can_reshape, forward_ctl, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
584 |
start_mem_src, start_mem_dest, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
585 |
atp_src, atp_dest, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
586 |
adr_src, base_src, adr_dest, base_dest, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
587 |
copy_type, value_type, count); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
588 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
589 |
Node* backward_mem = array_copy_backward(phase, can_reshape, backward_ctl, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
590 |
start_mem_src, start_mem_dest, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
591 |
atp_src, atp_dest, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
592 |
adr_src, base_src, adr_dest, base_dest, |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
593 |
copy_type, value_type, count); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
594 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
595 |
Node* ctl = NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
596 |
if (!forward_ctl->is_top() && !backward_ctl->is_top()) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
597 |
ctl = new RegionNode(3); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
598 |
mem = new PhiNode(ctl, Type::MEMORY, atp_dest); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
599 |
ctl->init_req(1, forward_ctl); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
600 |
mem->init_req(1, forward_mem); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
601 |
ctl->init_req(2, backward_ctl); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
602 |
mem->init_req(2, backward_mem); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
603 |
ctl = phase->transform(ctl); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
604 |
mem = phase->transform(mem); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
605 |
} else if (!forward_ctl->is_top()) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
606 |
ctl = forward_ctl; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
607 |
mem = forward_mem; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
608 |
} else { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
609 |
assert(!backward_ctl->is_top(), "no copy?"); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
610 |
ctl = backward_ctl; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
611 |
mem = backward_mem; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
612 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
613 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
614 |
if (can_reshape) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
615 |
assert(phase->is_IterGVN()->delay_transform(), "should be delaying transforms"); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
616 |
phase->is_IterGVN()->set_delay_transform(false); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
617 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
618 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
619 |
MergeMemNode* out_mem = MergeMemNode::make(in_mem); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
620 |
out_mem->set_memory_at(alias_idx_dest, mem); |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
621 |
mem = out_mem; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
622 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
623 |
if (!finish_transform(phase, can_reshape, ctl, mem)) { |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
624 |
return NULL; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
625 |
} |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
626 |
|
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
627 |
return mem; |
ef2be52deeaf
6912521: System.arraycopy works slower than the simple loop for little lengths
roland
parents:
diff
changeset
|
628 |
} |
30629
b6e5ad2f18d5
8076188: Optimize arraycopy out for non escaping destination
roland
parents:
29360
diff
changeset
|
629 |
|
b6e5ad2f18d5
8076188: Optimize arraycopy out for non escaping destination
roland
parents:
29360
diff
changeset
|
630 |
bool ArrayCopyNode::may_modify(const TypeOopPtr *t_oop, PhaseTransform *phase) { |
31044
9fecc7e87949
8080699: Assert failed: Not a Java pointer in JCK test
roland
parents:
30629
diff
changeset
|
631 |
Node* dest = in(ArrayCopyNode::Dest); |
9fecc7e87949
8080699: Assert failed: Not a Java pointer in JCK test
roland
parents:
30629
diff
changeset
|
632 |
if (dest->is_top()) { |
9fecc7e87949
8080699: Assert failed: Not a Java pointer in JCK test
roland
parents:
30629
diff
changeset
|
633 |
return false; |
9fecc7e87949
8080699: Assert failed: Not a Java pointer in JCK test
roland
parents:
30629
diff
changeset
|
634 |
} |
9fecc7e87949
8080699: Assert failed: Not a Java pointer in JCK test
roland
parents:
30629
diff
changeset
|
635 |
const TypeOopPtr* dest_t = phase->type(dest)->is_oopptr(); |
30629
b6e5ad2f18d5
8076188: Optimize arraycopy out for non escaping destination
roland
parents:
29360
diff
changeset
|
636 |
assert(!dest_t->is_known_instance() || _dest_type->is_known_instance(), "result of EA not recorded"); |
31044
9fecc7e87949
8080699: Assert failed: Not a Java pointer in JCK test
roland
parents:
30629
diff
changeset
|
637 |
assert(in(ArrayCopyNode::Src)->is_top() || !phase->type(in(ArrayCopyNode::Src))->is_oopptr()->is_known_instance() || |
9fecc7e87949
8080699: Assert failed: Not a Java pointer in JCK test
roland
parents:
30629
diff
changeset
|
638 |
_src_type->is_known_instance(), "result of EA not recorded"); |
30629
b6e5ad2f18d5
8076188: Optimize arraycopy out for non escaping destination
roland
parents:
29360
diff
changeset
|
639 |
|
b6e5ad2f18d5
8076188: Optimize arraycopy out for non escaping destination
roland
parents:
29360
diff
changeset
|
640 |
if (_dest_type != TypeOopPtr::BOTTOM || t_oop->is_known_instance()) { |
b6e5ad2f18d5
8076188: Optimize arraycopy out for non escaping destination
roland
parents:
29360
diff
changeset
|
641 |
assert(_dest_type == TypeOopPtr::BOTTOM || _dest_type->is_known_instance(), "result of EA is known instance"); |
b6e5ad2f18d5
8076188: Optimize arraycopy out for non escaping destination
roland
parents:
29360
diff
changeset
|
642 |
return t_oop->instance_id() == _dest_type->instance_id(); |
b6e5ad2f18d5
8076188: Optimize arraycopy out for non escaping destination
roland
parents:
29360
diff
changeset
|
643 |
} |
b6e5ad2f18d5
8076188: Optimize arraycopy out for non escaping destination
roland
parents:
29360
diff
changeset
|
644 |
|
b6e5ad2f18d5
8076188: Optimize arraycopy out for non escaping destination
roland
parents:
29360
diff
changeset
|
645 |
return CallNode::may_modify_arraycopy_helper(dest_t, t_oop, phase); |
b6e5ad2f18d5
8076188: Optimize arraycopy out for non escaping destination
roland
parents:
29360
diff
changeset
|
646 |
} |
32370
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
647 |
|
45427
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
648 |
bool ArrayCopyNode::may_modify_helper(const TypeOopPtr *t_oop, Node* n, PhaseTransform *phase, CallNode*& call) { |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
649 |
if (n != NULL && |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
650 |
n->is_Call() && |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
651 |
n->as_Call()->may_modify(t_oop, phase) && |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
652 |
(n->as_Call()->is_ArrayCopy() || n->as_Call()->is_call_to_arraycopystub())) { |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
653 |
call = n->as_Call(); |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
654 |
return true; |
32370
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
655 |
} |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
656 |
return false; |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
657 |
} |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
658 |
|
45427
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
659 |
bool ArrayCopyNode::may_modify(const TypeOopPtr *t_oop, MemBarNode* mb, PhaseTransform *phase, ArrayCopyNode*& ac) { |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
660 |
|
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
661 |
Node* c = mb->in(0); |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
662 |
|
50180 | 663 |
BarrierSetC2* bs = BarrierSet::barrier_set()->barrier_set_c2(); |
664 |
// step over g1 gc barrier if we're at e.g. a clone with ReduceInitialCardMarks off |
|
665 |
c = bs->step_over_gc_barrier(c); |
|
45427
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
666 |
|
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
667 |
CallNode* call = NULL; |
51078 | 668 |
guarantee(c != NULL, "step_over_gc_barrier failed, there must be something to step to."); |
669 |
if (c->is_Region()) { |
|
45427
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
670 |
for (uint i = 1; i < c->req(); i++) { |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
671 |
if (c->in(i) != NULL) { |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
672 |
Node* n = c->in(i)->in(0); |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
673 |
if (may_modify_helper(t_oop, n, phase, call)) { |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
674 |
ac = call->isa_ArrayCopy(); |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
675 |
assert(c == mb->in(0), "only for clone"); |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
676 |
return true; |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
677 |
} |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
678 |
} |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
679 |
} |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
680 |
} else if (may_modify_helper(t_oop, c->in(0), phase, call)) { |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
681 |
ac = call->isa_ArrayCopy(); |
50180 | 682 |
#ifdef ASSERT |
683 |
bool use_ReduceInitialCardMarks = BarrierSet::barrier_set()->is_a(BarrierSet::CardTableBarrierSet) && |
|
684 |
static_cast<CardTableBarrierSetC2*>(bs)->use_ReduceInitialCardMarks(); |
|
685 |
assert(c == mb->in(0) || (ac != NULL && ac->is_clonebasic() && !use_ReduceInitialCardMarks), "only for clone"); |
|
686 |
#endif |
|
45427
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
687 |
return true; |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
688 |
} |
32370
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
689 |
|
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
690 |
return false; |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
691 |
} |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
692 |
|
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
693 |
// Does this array copy modify offsets between offset_lo and offset_hi |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
694 |
// in the destination array |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
695 |
// if must_modify is false, return true if the copy could write |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
696 |
// between offset_lo and offset_hi |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
697 |
// if must_modify is true, return true if the copy is guaranteed to |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
698 |
// write between offset_lo and offset_hi |
45427
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
699 |
bool ArrayCopyNode::modifies(intptr_t offset_lo, intptr_t offset_hi, PhaseTransform* phase, bool must_modify) const { |
32370
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
700 |
assert(_kind == ArrayCopy || _kind == CopyOf || _kind == CopyOfRange, "only for real array copies"); |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
701 |
|
45427
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
702 |
Node* dest = in(Dest); |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
703 |
Node* dest_pos = in(DestPos); |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
704 |
Node* len = in(Length); |
32370
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
705 |
|
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
706 |
const TypeInt *dest_pos_t = phase->type(dest_pos)->isa_int(); |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
707 |
const TypeInt *len_t = phase->type(len)->isa_int(); |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
708 |
const TypeAryPtr* ary_t = phase->type(dest)->isa_aryptr(); |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
709 |
|
45427
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
710 |
if (dest_pos_t == NULL || len_t == NULL || ary_t == NULL) { |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
711 |
return !must_modify; |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
712 |
} |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
713 |
|
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
714 |
BasicType ary_elem = ary_t->klass()->as_array_klass()->element_type()->basic_type(); |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
715 |
uint header = arrayOopDesc::base_offset_in_bytes(ary_elem); |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
716 |
uint elemsize = type2aelembytes(ary_elem); |
32370
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
717 |
|
45427
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
718 |
jlong dest_pos_plus_len_lo = (((jlong)dest_pos_t->_lo) + len_t->_lo) * elemsize + header; |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
719 |
jlong dest_pos_plus_len_hi = (((jlong)dest_pos_t->_hi) + len_t->_hi) * elemsize + header; |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
720 |
jlong dest_pos_lo = ((jlong)dest_pos_t->_lo) * elemsize + header; |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
721 |
jlong dest_pos_hi = ((jlong)dest_pos_t->_hi) * elemsize + header; |
32370
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
722 |
|
45427
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
723 |
if (must_modify) { |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
724 |
if (offset_lo >= dest_pos_hi && offset_hi < dest_pos_plus_len_lo) { |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
725 |
return true; |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
726 |
} |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
727 |
} else { |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
728 |
if (offset_hi >= dest_pos_lo && offset_lo < dest_pos_plus_len_hi) { |
64e07017ce01
8179678: ArrayCopy with same src and dst can cause incorrect execution or compiler crash
roland
parents:
44322
diff
changeset
|
729 |
return true; |
32370
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
730 |
} |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
731 |
} |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
732 |
return false; |
38b7b5772b4f
8130847: Cloned object's fields observed as null after C2 escape analysis
roland
parents:
32084
diff
changeset
|
733 |
} |