author | pliden |
Thu, 12 Apr 2018 11:22:24 +0200 | |
changeset 49754 | ee93c1087584 |
parent 49748 | 6a880e576856 |
child 50162 | f9fe56417050 |
permissions | -rw-r--r-- |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1 |
/* |
48626
9f6f48d4f9a1
8194814: [ppc, s390] A row of minor fixes and cleanups
goetz
parents:
48476
diff
changeset
|
2 |
* Copyright (c) 1997, 2018, Oracle and/or its affiliates. All rights reserved. |
49376
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
3 |
* Copyright (c) 2012, 2018, SAP SE. All rights reserved. |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
4 |
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5 |
* |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
6 |
* This code is free software; you can redistribute it and/or modify it |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
7 |
* under the terms of the GNU General Public License version 2 only, as |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
8 |
* published by the Free Software Foundation. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
9 |
* |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
10 |
* This code is distributed in the hope that it will be useful, but WITHOUT |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
11 |
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
12 |
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
13 |
* version 2 for more details (a copy is included in the LICENSE file that |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
14 |
* accompanied this code). |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
15 |
* |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
16 |
* You should have received a copy of the GNU General Public License version |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
17 |
* 2 along with this work; if not, write to the Free Software Foundation, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
18 |
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
19 |
* |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
20 |
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
21 |
* or visit www.oracle.com if you need additional information or have any |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
22 |
* questions. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
23 |
* |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
24 |
*/ |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
25 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
26 |
#include "precompiled.hpp" |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
27 |
#include "asm/macroAssembler.inline.hpp" |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
28 |
#include "compiler/disassembler.hpp" |
30764 | 29 |
#include "gc/shared/collectedHeap.inline.hpp" |
49748 | 30 |
#include "gc/shared/barrierSet.hpp" |
31 |
#include "gc/shared/barrierSetAssembler.hpp" |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
32 |
#include "interpreter/interpreter.hpp" |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
33 |
#include "memory/resourceArea.hpp" |
35085 | 34 |
#include "nativeInst_ppc.hpp" |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
35 |
#include "prims/methodHandles.hpp" |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
36 |
#include "runtime/biasedLocking.hpp" |
25715
d5a8dbdc5150
8049325: Introduce and clean up umbrella headers for the files in the cpu subdirectories.
goetz
parents:
25374
diff
changeset
|
37 |
#include "runtime/icache.hpp" |
49449
ef5d5d343e2a
8199263: Split interfaceSupport.hpp to not require including .inline.hpp files
coleenp
parents:
49376
diff
changeset
|
38 |
#include "runtime/interfaceSupport.inline.hpp" |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
39 |
#include "runtime/objectMonitor.hpp" |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
40 |
#include "runtime/os.hpp" |
48332
651a95f30dfb
8193257: PPC64, s390 implementation for Thread-local handshakes
mdoerr
parents:
47580
diff
changeset
|
41 |
#include "runtime/safepoint.hpp" |
651a95f30dfb
8193257: PPC64, s390 implementation for Thread-local handshakes
mdoerr
parents:
47580
diff
changeset
|
42 |
#include "runtime/safepointMechanism.hpp" |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
43 |
#include "runtime/sharedRuntime.hpp" |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
44 |
#include "runtime/stubRoutines.hpp" |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
45 |
#include "utilities/macros.hpp" |
36303
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
46 |
#ifdef COMPILER2 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
47 |
#include "opto/intrinsicnode.hpp" |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
48 |
#endif |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
49 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
50 |
// BLOCK_COMMENT(str): forwards to block_comment(str) in non-PRODUCT builds and
// expands to nothing in PRODUCT builds.
#ifndef PRODUCT
#define BLOCK_COMMENT(str) block_comment(str)
#else
#define BLOCK_COMMENT(str) // nothing
#endif

// BIND(label): binds the label and then emits a block comment consisting of
// the label's source name followed by a colon.
#define BIND(label) bind(label); BLOCK_COMMENT(#label ":")
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
56 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
57 |
#ifdef ASSERT
// Platform hook for instruction-mark checking; only compiled when ASSERT is
// defined. On RISC, there's no benefit to verifying instruction boundaries,
// so this always answers false.
bool AbstractAssembler::pd_check_instruction_mark() {
  return false;
}
#endif
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
61 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
62 |
// Emit a doubleword load of [a + si31] into d, where si31 is a non-negative
// offset that must fit into 31 bits (asserted).
//
//  - If si31 fits a signed 16-bit immediate, a single ld is emitted, followed
//    by a nop when emit_filler_nop is non-zero (presumably so that both forms
//    occupy two instructions -- confirm with callers).
//  - Otherwise addis + ld is emitted, using d to hold the intermediate address.
//
// "Unchecked": this routine does not assert that d and a are different
// registers.
void MacroAssembler::ld_largeoffset_unchecked(Register d, int si31, Register a, int emit_filler_nop) {
  assert(Assembler::is_simm(si31, 31) && si31 >= 0, "si31 out of range");

  if (!Assembler::is_simm(si31, 16)) {
    // Large offset: add the high part to the base first, then load using the low part.
    const int upper = MacroAssembler::largeoffset_si16_si16_hi(si31);
    const int lower = MacroAssembler::largeoffset_si16_si16_lo(si31);
    addis(d, a, upper);
    ld(d, lower, d);
    return;
  }

  // Small offset: a single load is sufficient.
  ld(d, si31, a);
  if (emit_filler_nop) {
    nop();
  }
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
74 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
75 |
// Checked front end for ld_largeoffset_unchecked: asserts that the destination
// register d and the base register a are different, then delegates all code
// emission to the unchecked variant with the same arguments.
void MacroAssembler::ld_largeoffset(Register d, int si31, Register a, int emit_filler_nop) {
  assert_different_registers(d, a);
  ld_largeoffset_unchecked(d, si31, a, emit_filler_nop);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
79 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
80 |
void MacroAssembler::load_sized_value(Register dst, RegisterOrConstant offs, Register base, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
81 |
size_t size_in_bytes, bool is_signed) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
82 |
switch (size_in_bytes) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
83 |
case 8: ld(dst, offs, base); break; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
84 |
case 4: is_signed ? lwa(dst, offs, base) : lwz(dst, offs, base); break; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
85 |
case 2: is_signed ? lha(dst, offs, base) : lhz(dst, offs, base); break; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
86 |
case 1: lbz(dst, offs, base); if (is_signed) extsb(dst, dst); break; // lba doesn't exist :( |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
87 |
default: ShouldNotReachHere(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
88 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
89 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
90 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
91 |
void MacroAssembler::store_sized_value(Register dst, RegisterOrConstant offs, Register base, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
92 |
size_t size_in_bytes) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
93 |
switch (size_in_bytes) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
94 |
case 8: std(dst, offs, base); break; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
95 |
case 4: stw(dst, offs, base); break; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
96 |
case 2: sth(dst, offs, base); break; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
97 |
case 1: stb(dst, offs, base); break; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
98 |
default: ShouldNotReachHere(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
99 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
100 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
101 |
|
22861 | 102 |
void MacroAssembler::align(int modulus, int max, int rem) { |
103 |
int padding = (rem + modulus - (offset() % modulus)) % modulus; |
|
104 |
if (padding > max) return; |
|
105 |
for (int c = (padding >> 2); c > 0; --c) { nop(); } |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
106 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
107 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
108 |
// Issue instructions that calculate given TOC from global TOC. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
109 |
void MacroAssembler::calculate_address_from_global_toc(Register dst, address addr, bool hi16, bool lo16, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
110 |
bool add_relocation, bool emit_dummy_addr) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
111 |
int offset = -1; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
112 |
if (emit_dummy_addr) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
113 |
offset = -128; // dummy address |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
114 |
} else if (addr != (address)(intptr_t)-1) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
115 |
offset = MacroAssembler::offset_to_global_toc(addr); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
116 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
117 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
118 |
if (hi16) { |
35085 | 119 |
addis(dst, R29_TOC, MacroAssembler::largeoffset_si16_si16_hi(offset)); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
120 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
121 |
if (lo16) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
122 |
if (add_relocation) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
123 |
// Relocate at the addi to avoid confusion with a load from the method's TOC. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
124 |
relocate(internal_word_Relocation::spec(addr)); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
125 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
126 |
addi(dst, dst, MacroAssembler::largeoffset_si16_si16_lo(offset)); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
127 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
128 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
129 |
|
47520
50790528dd25
8187547: PPC64: icache invalidation is incorrect in some places
goetz
parents:
47216
diff
changeset
|
130 |
// Re-patch an addis/addi pair (as emitted by calculate_address_from_global_toc)
// so that it computes addr relative to the global TOC.
//
//   a     - address of the second instruction, the addi (the relocation points here).
//   bound - lowest address that is examined while scanning backwards for the addis.
//   addr  - new target address; its offset to the global TOC is split into the
//           two 16-bit immediates.
//
// Returns the address of the patched addis, i.e. the lower of the two patched
// instruction addresses.
address MacroAssembler::patch_calculate_address_from_global_toc_at(address a, address bound, address addr) {
  const int offset = MacroAssembler::offset_to_global_toc(addr);

  const address inst2_addr = a;
  const int inst2 = *(int *)inst2_addr;

  // The relocation points to the second instruction, the addi,
  // and the addi reads and writes the same register dst.
  const int dst = inv_rt_field(inst2);
  assert(is_addi(inst2) && inv_ra_field(inst2) == dst, "must be addi reading and writing dst");

  // Now, find the preceding addis which writes to dst.
  int inst1 = 0;
  address inst1_addr = inst2_addr - BytesPerInstWord;
  while (inst1_addr >= bound) {
    inst1 = *(int *) inst1_addr;
    if (is_addis(inst1) && inv_rt_field(inst1) == dst) {
      // Stop, found the addis which writes dst.
      break;
    }
    inst1_addr -= BytesPerInstWord;
  }

  // If the scan ran past bound, inst1 still holds the last word examined and
  // inst1_addr already points below bound. Checking the target register here
  // ensures an unrelated "addis rX, R29, ..." cannot satisfy the check below
  // and cause memory outside [bound, a] to be patched.
  assert(is_addis(inst1) && inv_rt_field(inst1) == dst, "addis writing dst not found within bound");
  assert(is_addis(inst1) && inv_ra_field(inst1) == 29 /* R29 */, "source must be global TOC");
  set_imm((int *)inst1_addr, MacroAssembler::largeoffset_si16_si16_hi(offset));
  set_imm((int *)inst2_addr, MacroAssembler::largeoffset_si16_si16_lo(offset));
  return inst1_addr;
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
158 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
159 |
// Decode the address computed by an addis/addi pair (as emitted by
// calculate_address_from_global_toc).
//
//   a     - address of the second instruction, the addi (the relocation points here).
//   bound - lowest address that is examined while scanning backwards for the addis.
//
// Returns global_toc() + decoded offset, or (address)-1 if the decoded offset
// is the special value -1.
address MacroAssembler::get_address_of_calculate_address_from_global_toc_at(address a, address bound) {
  const address inst2_addr = a;
  const int inst2 = *(int *)inst2_addr;

  // The relocation points to the second instruction, the addi,
  // and the addi reads and writes the same register dst.
  const int dst = inv_rt_field(inst2);
  assert(is_addi(inst2) && inv_ra_field(inst2) == dst, "must be addi reading and writing dst");

  // Now, find the preceding addis which writes to dst.
  int inst1 = 0;
  address inst1_addr = inst2_addr - BytesPerInstWord;
  while (inst1_addr >= bound) {
    inst1 = *(int *) inst1_addr;
    if (is_addis(inst1) && inv_rt_field(inst1) == dst) {
      // Stop, found the addis which writes dst.
      break;
    }
    inst1_addr -= BytesPerInstWord;
  }

  // If the scan ran past bound, inst1 still holds the last word examined and
  // inst1_addr already points below bound. Checking the target register here
  // ensures an unrelated "addis rX, R29, ..." cannot satisfy the check below
  // and cause an immediate to be read from outside [bound, a].
  assert(is_addis(inst1) && inv_rt_field(inst1) == dst, "addis writing dst not found within bound");
  assert(is_addis(inst1) && inv_ra_field(inst1) == 29 /* R29 */, "source must be global TOC");

  // Recombine the two 16-bit immediates into the TOC-relative offset.
  int offset = (get_imm(inst1_addr, 0) << 16) + get_imm(inst2_addr, 0);
  // -1 is a special case
  if (offset == -1) {
    return (address)(intptr_t)-1;
  } else {
    return global_toc() + offset;
  }
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
190 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
191 |
#ifdef _LP64 |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
192 |
// Patch compressed oops or klass constants. |
22861 | 193 |
// Assembler sequence is |
194 |
// 1) compressed oops: |
|
195 |
// lis rx = const.hi |
|
196 |
// ori rx = rx | const.lo |
|
197 |
// 2) compressed klass: |
|
198 |
// lis rx = const.hi |
|
199 |
// clrldi rx = rx & 0xFFFFffff // clearMS32b, optional |
|
200 |
// ori rx = rx | const.lo |
|
201 |
// Clrldi will be passed by. |
|
47520
50790528dd25
8187547: PPC64: icache invalidation is incorrect in some places
goetz
parents:
47216
diff
changeset
|
202 |
address MacroAssembler::patch_set_narrow_oop(address a, address bound, narrowOop data) { |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
203 |
assert(UseCompressedOops, "Should only patch compressed oops"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
204 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
205 |
const address inst2_addr = a; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
206 |
const int inst2 = *(int *)inst2_addr; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
207 |
|
22861 | 208 |
// The relocation points to the second instruction, the ori, |
209 |
// and the ori reads and writes the same register dst. |
|
210 |
const int dst = inv_rta_field(inst2); |
|
22867 | 211 |
assert(is_ori(inst2) && inv_rs_field(inst2) == dst, "must be ori reading and writing dst"); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
212 |
// Now, find the preceding addis which writes to dst. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
213 |
int inst1 = 0; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
214 |
address inst1_addr = inst2_addr - BytesPerInstWord; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
215 |
bool inst1_found = false; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
216 |
while (inst1_addr >= bound) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
217 |
inst1 = *(int *)inst1_addr; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
218 |
if (is_lis(inst1) && inv_rs_field(inst1) == dst) { inst1_found = true; break; } |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
219 |
inst1_addr -= BytesPerInstWord; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
220 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
221 |
assert(inst1_found, "inst is not lis"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
222 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
223 |
int xc = (data >> 16) & 0xffff; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
224 |
int xd = (data >> 0) & 0xffff; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
225 |
|
22861 | 226 |
set_imm((int *)inst1_addr, (short)(xc)); // see enc_load_con_narrow_hi/_lo |
22867 | 227 |
set_imm((int *)inst2_addr, (xd)); // unsigned int |
47520
50790528dd25
8187547: PPC64: icache invalidation is incorrect in some places
goetz
parents:
47216
diff
changeset
|
228 |
return inst1_addr; |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
229 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
230 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
231 |
// Get compressed oop or klass constant. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
232 |
narrowOop MacroAssembler::get_narrow_oop(address a, address bound) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
233 |
assert(UseCompressedOops, "Should only patch compressed oops"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
234 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
235 |
const address inst2_addr = a; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
236 |
const int inst2 = *(int *)inst2_addr; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
237 |
|
22861 | 238 |
// The relocation points to the second instruction, the ori, |
239 |
// and the ori reads and writes the same register dst. |
|
240 |
const int dst = inv_rta_field(inst2); |
|
22867 | 241 |
assert(is_ori(inst2) && inv_rs_field(inst2) == dst, "must be ori reading and writing dst"); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
242 |
// Now, find the preceding lis which writes to dst. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
243 |
int inst1 = 0; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
244 |
address inst1_addr = inst2_addr - BytesPerInstWord; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
245 |
bool inst1_found = false; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
246 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
247 |
while (inst1_addr >= bound) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
248 |
inst1 = *(int *) inst1_addr; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
249 |
if (is_lis(inst1) && inv_rs_field(inst1) == dst) { inst1_found = true; break;} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
250 |
inst1_addr -= BytesPerInstWord; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
251 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
252 |
assert(inst1_found, "inst is not lis"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
253 |
|
22861 | 254 |
uint xl = ((unsigned int) (get_imm(inst2_addr, 0) & 0xffff)); |
255 |
uint xh = (((get_imm(inst1_addr, 0)) & 0xffff) << 16); |
|
256 |
||
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
257 |
return (int) (xl | xh); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
258 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
259 |
#endif // _LP64 |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
260 |
|
35085 | 261 |
// Returns true if successful. |
262 |
bool MacroAssembler::load_const_from_method_toc(Register dst, AddressLiteral& a, |
|
263 |
Register toc, bool fixed_size) { |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
264 |
int toc_offset = 0; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
265 |
// Use RelocationHolder::none for the constant pool entry, otherwise |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
266 |
// we will end up with a failing NativeCall::verify(x) where x is |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
267 |
// the address of the constant pool entry. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
268 |
// FIXME: We should insert relocation information for oops at the constant |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
269 |
// pool entries instead of inserting it at the loads; patching of a constant |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
270 |
// pool entry should be less expensive. |
35085 | 271 |
address const_address = address_constant((address)a.value(), RelocationHolder::none); |
272 |
if (const_address == NULL) { return false; } // allocation failure |
|
22861 | 273 |
// Relocate at the pc of the load. |
274 |
relocate(a.rspec()); |
|
35085 | 275 |
toc_offset = (int)(const_address - code()->consts()->start()); |
276 |
ld_largeoffset_unchecked(dst, toc_offset, toc, fixed_size); |
|
277 |
return true; |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
278 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
279 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
280 |
// Check whether the instruction at `a` can start a load_const_from_method_toc
// sequence: the relocation points either to an ld, or to an addis whose
// RA field is non-zero.
bool MacroAssembler::is_load_const_from_method_toc_at(address a) {
  const int first_inst = *(int *)a;

  if (is_ld(first_inst)) {
    return true;
  }
  return is_addis(first_inst) && inv_ra_field(first_inst) != 0;
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
288 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
289 |
// Decode the offset used by the load_const_from_method_toc sequence at `a`.
//
// Short form: a single ld, whose displacement field is the offset.
// Long form:  an addis followed (not necessarily immediately) by an ld that
//             reads and writes the addis' target register; the offset is the
//             addis displacement shifted left by 16 plus the ld displacement.
int MacroAssembler::get_offset_of_load_const_from_method_toc_at(address a) {
  assert(is_load_const_from_method_toc_at(a), "must be load_const_from_method_toc");

  const address first_addr = a;
  const int     first_inst = *(int *)first_addr;

  if (is_ld(first_inst)) {
    return inv_d1_field(first_inst);
  }

  if (!is_addis(first_inst)) {
    ShouldNotReachHere();
    return 0;
  }

  const int dst = inv_rt_field(first_inst);

  // Scan forward for the succeeding ld which reads and writes dst.
  address ld_addr = first_addr + BytesPerInstWord;
  int     ld_inst = *(int *) ld_addr;
  while (!(is_ld(ld_inst) && inv_ra_field(ld_inst) == dst && inv_rt_field(ld_inst) == dst)) {
    ld_addr += BytesPerInstWord;
    ld_inst = *(int *) ld_addr;
  }

  return (inv_d1_field(first_inst) << 16) + inv_d1_field(ld_inst);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
316 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
317 |
// Get the constant from a `load_const' sequence. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
318 |
long MacroAssembler::get_const(address a) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
319 |
assert(is_load_const_at(a), "not a load of a constant"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
320 |
const int *p = (const int*) a; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
321 |
unsigned long x = (((unsigned long) (get_imm(a,0) & 0xffff)) << 48); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
322 |
if (is_ori(*(p+1))) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
323 |
x |= (((unsigned long) (get_imm(a,1) & 0xffff)) << 32); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
324 |
x |= (((unsigned long) (get_imm(a,3) & 0xffff)) << 16); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
325 |
x |= (((unsigned long) (get_imm(a,4) & 0xffff))); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
326 |
} else if (is_lis(*(p+1))) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
327 |
x |= (((unsigned long) (get_imm(a,2) & 0xffff)) << 32); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
328 |
x |= (((unsigned long) (get_imm(a,1) & 0xffff)) << 16); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
329 |
x |= (((unsigned long) (get_imm(a,3) & 0xffff))); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
330 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
331 |
ShouldNotReachHere(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
332 |
return (long) 0; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
333 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
334 |
return (long) x; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
335 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
336 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
337 |
// Patch the 64 bit constant of a `load_const' sequence. This is a low |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
338 |
// level procedure. It neither flushes the instruction cache nor is it |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
339 |
// mt safe. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
340 |
void MacroAssembler::patch_const(address a, long x) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
341 |
assert(is_load_const_at(a), "not a load of a constant"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
342 |
int *p = (int*) a; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
343 |
if (is_ori(*(p+1))) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
344 |
set_imm(0 + p, (x >> 48) & 0xffff); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
345 |
set_imm(1 + p, (x >> 32) & 0xffff); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
346 |
set_imm(3 + p, (x >> 16) & 0xffff); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
347 |
set_imm(4 + p, x & 0xffff); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
348 |
} else if (is_lis(*(p+1))) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
349 |
set_imm(0 + p, (x >> 48) & 0xffff); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
350 |
set_imm(2 + p, (x >> 32) & 0xffff); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
351 |
set_imm(1 + p, (x >> 16) & 0xffff); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
352 |
set_imm(3 + p, x & 0xffff); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
353 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
354 |
ShouldNotReachHere(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
355 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
356 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
357 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
358 |
// Build an AddressLiteral for `obj` whose relocation refers to a metadata
// index newly allocated from the oop recorder.
AddressLiteral MacroAssembler::allocate_metadata_address(Metadata* obj) {
  assert(oop_recorder() != NULL, "this assembler needs a Recorder");
  const int metadata_index = oop_recorder()->allocate_metadata_index(obj);
  return AddressLiteral((address)obj, metadata_Relocation::spec(metadata_index));
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
364 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
365 |
// Build an AddressLiteral for `obj` whose relocation refers to the metadata
// index the oop recorder reports for it via find_index().
AddressLiteral MacroAssembler::constant_metadata_address(Metadata* obj) {
  assert(oop_recorder() != NULL, "this assembler needs a Recorder");
  const int metadata_index = oop_recorder()->find_index(obj);
  return AddressLiteral((address)obj, metadata_Relocation::spec(metadata_index));
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
371 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
372 |
// Build an AddressLiteral for `obj` whose relocation refers to an oop index
// newly allocated from the oop recorder.
AddressLiteral MacroAssembler::allocate_oop_address(jobject obj) {
  assert(oop_recorder() != NULL, "this assembler needs an OopRecorder");
  const int index = oop_recorder()->allocate_oop_index(obj);
  RelocationHolder rspec = oop_Relocation::spec(index);
  return AddressLiteral(address(obj), rspec);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
377 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
378 |
// Build an AddressLiteral for `obj` whose relocation refers to the oop index
// the oop recorder reports for it via find_index().
AddressLiteral MacroAssembler::constant_oop_address(jobject obj) {
  assert(oop_recorder() != NULL, "this assembler needs an OopRecorder");
  const int index = oop_recorder()->find_index(obj);
  RelocationHolder rspec = oop_Relocation::spec(index);
  return AddressLiteral(address(obj), rspec);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
383 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
384 |
// Produce `*delayed_value_addr + offset` either as a constant or in `tmp`.
//
// If the slot already holds a non-zero value, the sum is returned as a
// constant and no code is emitted. Otherwise code is emitted that loads the
// slot at run time into `tmp` and adds `offset`, and `tmp` is returned.
RegisterOrConstant MacroAssembler::delayed_value_impl(intptr_t* delayed_value_addr,
                                                      Register tmp, int offset) {
  const intptr_t current = *delayed_value_addr;

  if (current == 0) {
    // Load indirectly to solve generation ordering problem.
    // static address, no relocation
    const int simm16_offset = load_const_optimized(tmp, delayed_value_addr, noreg, true);
    ld(tmp, simm16_offset, tmp); // must be aligned ((xa & 3) == 0)

    if (offset != 0) {
      addi(tmp, tmp, offset);
    }
    return RegisterOrConstant(tmp);
  }

  return RegisterOrConstant(current + offset);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
402 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
403 |
#ifndef PRODUCT |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
404 |
// Not provided on this platform yet; calling it hits Unimplemented().
void MacroAssembler::pd_print_patched_instruction(address branch) {
  // TODO: PPC port
  Unimplemented();
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
407 |
#endif // ndef PRODUCT |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
408 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
409 |
// Conditional far branch for destinations encodable in 24+2 bits. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
410 |
void MacroAssembler::bc_far(int boint, int biint, Label& dest, int optimize) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
411 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
412 |
// If requested by flag optimize, relocate the bc_far as a |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
413 |
// runtime_call and prepare for optimizing it when the code gets |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
414 |
// relocated. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
415 |
if (optimize == bc_far_optimize_on_relocate) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
416 |
relocate(relocInfo::runtime_call_type); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
417 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
418 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
419 |
// variant 2: |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
420 |
// |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
421 |
// b!cxx SKIP |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
422 |
// bxx DEST |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
423 |
// SKIP: |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
424 |
// |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
425 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
426 |
const int opposite_boint = add_bhint_to_boint(opposite_bhint(inv_boint_bhint(boint)), |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
427 |
opposite_bcond(inv_boint_bcond(boint))); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
428 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
429 |
// We emit two branches. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
430 |
// First, a conditional branch which jumps around the far branch. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
431 |
const address not_taken_pc = pc() + 2 * BytesPerInstWord; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
432 |
const address bc_pc = pc(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
433 |
bc(opposite_boint, biint, not_taken_pc); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
434 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
435 |
const int bc_instr = *(int*)bc_pc; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
436 |
assert(not_taken_pc == (address)inv_bd_field(bc_instr, (intptr_t)bc_pc), "postcondition"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
437 |
assert(opposite_boint == inv_bo_field(bc_instr), "postcondition"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
438 |
assert(boint == add_bhint_to_boint(opposite_bhint(inv_boint_bhint(inv_bo_field(bc_instr))), |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
439 |
opposite_bcond(inv_boint_bcond(inv_bo_field(bc_instr)))), |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
440 |
"postcondition"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
441 |
assert(biint == inv_bi_field(bc_instr), "postcondition"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
442 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
443 |
// Second, an unconditional far branch which jumps to dest. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
444 |
// Note: target(dest) remembers the current pc (see CodeSection::target) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
445 |
// and returns the current pc if the label is not bound yet; when |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
446 |
// the label gets bound, the unconditional far branch will be patched. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
447 |
const address target_pc = target(dest); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
448 |
const address b_pc = pc(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
449 |
b(target_pc); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
450 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
451 |
assert(not_taken_pc == pc(), "postcondition"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
452 |
assert(dest.is_bound() || target_pc == b_pc, "postcondition"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
453 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
454 |
|
35085 | 455 |
// 1 or 2 instructions |
456 |
void MacroAssembler::bc_far_optimized(int boint, int biint, Label& dest) { |
|
457 |
if (dest.is_bound() && is_within_range_of_bcxx(target(dest), pc())) { |
|
458 |
bc(boint, biint, dest); |
|
459 |
} else { |
|
460 |
bc_far(boint, biint, dest, MacroAssembler::bc_far_optimize_on_relocate); |
|
461 |
} |
|
462 |
} |
|
463 |
||
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
464 |
// Returns true if the code at instruction_addr is recognized as any of the
// three bc_far variants (checked in the order 1, 2, 3).
bool MacroAssembler::is_bc_far_at(address instruction_addr) {
  if (is_bc_far_variant1_at(instruction_addr)) {
    return true;
  }
  if (is_bc_far_variant2_at(instruction_addr)) {
    return true;
  }
  return is_bc_far_variant3_at(instruction_addr);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
469 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
470 |
// Returns the branch destination of the bc_far sequence at instruction_addr.
//
//   variant 1: decoded from the bd field of the first instruction word
//   variant 2: destination of the branch in the second instruction word
//   variant 3: the address right behind the two-word sequence
//
// Any other code pattern is a fatal error (ShouldNotReachHere).
address MacroAssembler::get_dest_of_bc_far_at(address instruction_addr) {
  if (is_bc_far_variant1_at(instruction_addr)) {
    const int bc_word = *(int*)instruction_addr;
    return (address)inv_bd_field(bc_word, (intptr_t)instruction_addr);
  }

  if (is_bc_far_variant2_at(instruction_addr)) {
    const address second_word_addr = instruction_addr + 4;
    return bxx_destination(second_word_addr);
  }

  if (is_bc_far_variant3_at(instruction_addr)) {
    return instruction_addr + 8;
  }

  // variant 4 ???
  ShouldNotReachHere();
  return NULL;
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
485 |
// Re-targets the two-word bc_far sequence at instruction_addr to dest by
// re-emitting it in place, then flushes the icache for the patched bytes.
//
// A sequence that is already variant 3 (nops) is left untouched. Otherwise
// the branch condition is recovered from the existing code and one of these
// forms is written:
//
//   variant 3 (old code is variant 2 and dest is the next instruction):
//       nop
//       endgroup
//     SKIP/DEST:
//
//   variant 1 (dest within range of bcxx):
//       bcxx  DEST
//       nop
//
//   variant 2 (everything else):
//       b!cxx SKIP
//       bxx   DEST
//     SKIP:
void MacroAssembler::set_dest_of_bc_far_at(address instruction_addr, address dest) {
  // variant 3, far cond branch to the next instruction, already patched to nops.
  if (is_bc_far_variant3_at(instruction_addr)) {
    return;
  }

  // Assembler that writes directly over the existing two instruction words.
  const int patch_bytes = 2 * BytesPerInstWord;
  ResourceMark rm;
  CodeBuffer patch_buf(instruction_addr, patch_bytes);
  MacroAssembler masm(&patch_buf);

  const bool collapse_to_nops =
      is_bc_far_variant2_at(instruction_addr) && dest == instruction_addr + 8;

  if (collapse_to_nops) {
    // Far branch to next instruction: Optimize it by patching nops (produce variant 3).
    masm.nop();
    masm.endgroup();
  } else {
    // Step 1: recover boint and biint of the logical branch from the old code.
    int branch_bo = 0;
    int branch_bi = 0;

    if (is_bc_far_variant1_at(instruction_addr)) {
      // variant 1: the first word is the conditional branch itself.
      const int first_word = *(int*)(instruction_addr);
      branch_bo = inv_bo_field(first_word);
      branch_bi = inv_bi_field(first_word);
    } else if (is_bc_far_variant2_at(instruction_addr)) {
      // variant 2: the first word holds the opposite condition, so invert
      // both the hint and the condition to get the logical branch back.
      const int first_word = *(int*)(instruction_addr);
      const int stored_bo  = inv_bo_field(first_word);
      branch_bo = add_bhint_to_boint(opposite_bhint(inv_boint_bhint(stored_bo)),
                                     opposite_bcond(inv_boint_bcond(stored_bo)));
      branch_bi = inv_bi_field(first_word);
    } else {
      // variant 4???
      ShouldNotReachHere();
    }

    // Step 2: set the new branch destination and optimize the code.
    const bool use_short_form =
        dest != instruction_addr + 4 &&  // the bc_far is still unbound!
        masm.is_within_range_of_bcxx(dest, instruction_addr);

    if (use_short_form) {
      // variant 1
      masm.bc(branch_bo, branch_bi, dest);
      masm.nop();
    } else {
      // variant 2
      const int inverted_bo = add_bhint_to_boint(opposite_bhint(inv_boint_bhint(branch_bo)),
                                                 opposite_bcond(inv_boint_bcond(branch_bo)));
      const address skip_pc = masm.pc() + 2 * BytesPerInstWord;
      masm.bc(inverted_bo, branch_bi, skip_pc);
      masm.b(dest);
    }
  }

  ICache::ppc64_flush_icache_bytes(instruction_addr, patch_bytes);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
561 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
562 |
// Emit a NOT mt-safe patchable 64 bit absolute call/jump. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
563 |
void MacroAssembler::bxx64_patchable(address dest, relocInfo::relocType rt, bool link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
564 |
// get current pc |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
565 |
uint64_t start_pc = (uint64_t) pc(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
566 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
567 |
const address pc_of_bl = (address) (start_pc + (6*BytesPerInstWord)); // bl is last |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
568 |
const address pc_of_b = (address) (start_pc + (0*BytesPerInstWord)); // b is first |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
569 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
570 |
// relocate here |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
571 |
if (rt != relocInfo::none) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
572 |
relocate(rt); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
573 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
574 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
575 |
if ( ReoptimizeCallSequences && |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
576 |
(( link && is_within_range_of_b(dest, pc_of_bl)) || |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
577 |
(!link && is_within_range_of_b(dest, pc_of_b)))) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
578 |
// variant 2: |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
579 |
// Emit an optimized, pc-relative call/jump. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
580 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
581 |
if (link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
582 |
// some padding |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
583 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
584 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
585 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
586 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
587 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
588 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
589 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
590 |
// do the call |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
591 |
assert(pc() == pc_of_bl, "just checking"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
592 |
bl(dest, relocInfo::none); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
593 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
594 |
// do the jump |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
595 |
assert(pc() == pc_of_b, "just checking"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
596 |
b(dest, relocInfo::none); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
597 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
598 |
// some padding |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
599 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
600 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
601 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
602 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
603 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
604 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
605 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
606 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
607 |
// Assert that we can identify the emitted call/jump. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
608 |
assert(is_bxx64_patchable_variant2_at((address)start_pc, link), |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
609 |
"can't identify emitted call"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
610 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
611 |
// variant 1: |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
612 |
mr(R0, R11); // spill R11 -> R0. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
613 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
614 |
// Load the destination address into CTR, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
615 |
// calculate destination relative to global toc. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
616 |
calculate_address_from_global_toc(R11, dest, true, true, false); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
617 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
618 |
mtctr(R11); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
619 |
mr(R11, R0); // spill R11 <- R0. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
620 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
621 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
622 |
// do the call/jump |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
623 |
if (link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
624 |
bctrl(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
625 |
} else{ |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
626 |
bctr(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
627 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
628 |
// Assert that we can identify the emitted call/jump. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
629 |
assert(is_bxx64_patchable_variant1b_at((address)start_pc, link), |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
630 |
"can't identify emitted call"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
631 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
632 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
633 |
// Assert that we can identify the emitted call/jump. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
634 |
assert(is_bxx64_patchable_at((address)start_pc, link), |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
635 |
"can't identify emitted call"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
636 |
assert(get_dest_of_bxx64_patchable_at((address)start_pc, link) == dest, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
637 |
"wrong encoding of dest address"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
638 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
639 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
640 |
// Identify a bxx64_patchable instruction. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
641 |
bool MacroAssembler::is_bxx64_patchable_at(address instruction_addr, bool link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
642 |
return is_bxx64_patchable_variant1b_at(instruction_addr, link) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
643 |
//|| is_bxx64_patchable_variant1_at(instruction_addr, link) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
644 |
|| is_bxx64_patchable_variant2_at(instruction_addr, link); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
645 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
646 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
647 |
// Does the call64_patchable instruction use a pc-relative encoding of |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
648 |
// the call destination? |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
649 |
bool MacroAssembler::is_bxx64_patchable_pcrelative_at(address instruction_addr, bool link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
650 |
// variant 2 is pc-relative |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
651 |
return is_bxx64_patchable_variant2_at(instruction_addr, link); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
652 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
653 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
654 |
// Identify variant 1. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
655 |
bool MacroAssembler::is_bxx64_patchable_variant1_at(address instruction_addr, bool link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
656 |
unsigned int* instr = (unsigned int*) instruction_addr; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
657 |
return (link ? is_bctrl(instr[6]) : is_bctr(instr[6])) // bctr[l] |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
658 |
&& is_mtctr(instr[5]) // mtctr |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
659 |
&& is_load_const_at(instruction_addr); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
660 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
661 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
662 |
// Identify variant 1b: load destination relative to global toc. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
663 |
bool MacroAssembler::is_bxx64_patchable_variant1b_at(address instruction_addr, bool link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
664 |
unsigned int* instr = (unsigned int*) instruction_addr; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
665 |
return (link ? is_bctrl(instr[6]) : is_bctr(instr[6])) // bctr[l] |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
666 |
&& is_mtctr(instr[3]) // mtctr |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
667 |
&& is_calculate_address_from_global_toc_at(instruction_addr + 2*BytesPerInstWord, instruction_addr); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
668 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
669 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
670 |
// Identify variant 2. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
671 |
bool MacroAssembler::is_bxx64_patchable_variant2_at(address instruction_addr, bool link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
672 |
unsigned int* instr = (unsigned int*) instruction_addr; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
673 |
if (link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
674 |
return is_bl (instr[6]) // bl dest is last |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
675 |
&& is_nop(instr[0]) // nop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
676 |
&& is_nop(instr[1]) // nop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
677 |
&& is_nop(instr[2]) // nop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
678 |
&& is_nop(instr[3]) // nop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
679 |
&& is_nop(instr[4]) // nop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
680 |
&& is_nop(instr[5]); // nop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
681 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
682 |
return is_b (instr[0]) // b dest is first |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
683 |
&& is_nop(instr[1]) // nop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
684 |
&& is_nop(instr[2]) // nop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
685 |
&& is_nop(instr[3]) // nop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
686 |
&& is_nop(instr[4]) // nop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
687 |
&& is_nop(instr[5]) // nop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
688 |
&& is_nop(instr[6]); // nop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
689 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
690 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
691 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
692 |
// Set dest address of a bxx64_patchable instruction. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
693 |
void MacroAssembler::set_dest_of_bxx64_patchable_at(address instruction_addr, address dest, bool link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
694 |
ResourceMark rm; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
695 |
int code_size = MacroAssembler::bxx64_patchable_size; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
696 |
CodeBuffer buf(instruction_addr, code_size); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
697 |
MacroAssembler masm(&buf); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
698 |
masm.bxx64_patchable(dest, relocInfo::none, link); |
22861 | 699 |
ICache::ppc64_flush_icache_bytes(instruction_addr, code_size); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
700 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
701 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
702 |
// Get dest address of a bxx64_patchable instruction. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
703 |
address MacroAssembler::get_dest_of_bxx64_patchable_at(address instruction_addr, bool link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
704 |
if (is_bxx64_patchable_variant1_at(instruction_addr, link)) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
705 |
return (address) (unsigned long) get_const(instruction_addr); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
706 |
} else if (is_bxx64_patchable_variant2_at(instruction_addr, link)) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
707 |
unsigned int* instr = (unsigned int*) instruction_addr; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
708 |
if (link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
709 |
const int instr_idx = 6; // bl is last |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
710 |
int branchoffset = branch_destination(instr[instr_idx], 0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
711 |
return instruction_addr + branchoffset + instr_idx*BytesPerInstWord; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
712 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
713 |
const int instr_idx = 0; // b is first |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
714 |
int branchoffset = branch_destination(instr[instr_idx], 0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
715 |
return instruction_addr + branchoffset + instr_idx*BytesPerInstWord; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
716 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
717 |
// Load dest relative to global toc. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
718 |
} else if (is_bxx64_patchable_variant1b_at(instruction_addr, link)) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
719 |
return get_address_of_calculate_address_from_global_toc_at(instruction_addr + 2*BytesPerInstWord, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
720 |
instruction_addr); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
721 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
722 |
ShouldNotReachHere(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
723 |
return NULL; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
724 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
725 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
726 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
727 |
// Uses ordering which corresponds to ABI: |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
728 |
// _savegpr0_14: std r14,-144(r1) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
729 |
// _savegpr0_15: std r15,-136(r1) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
730 |
// _savegpr0_16: std r16,-128(r1) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
731 |
void MacroAssembler::save_nonvolatile_gprs(Register dst, int offset) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
732 |
std(R14, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
733 |
std(R15, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
734 |
std(R16, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
735 |
std(R17, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
736 |
std(R18, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
737 |
std(R19, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
738 |
std(R20, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
739 |
std(R21, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
740 |
std(R22, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
741 |
std(R23, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
742 |
std(R24, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
743 |
std(R25, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
744 |
std(R26, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
745 |
std(R27, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
746 |
std(R28, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
747 |
std(R29, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
748 |
std(R30, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
749 |
std(R31, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
750 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
751 |
stfd(F14, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
752 |
stfd(F15, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
753 |
stfd(F16, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
754 |
stfd(F17, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
755 |
stfd(F18, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
756 |
stfd(F19, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
757 |
stfd(F20, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
758 |
stfd(F21, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
759 |
stfd(F22, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
760 |
stfd(F23, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
761 |
stfd(F24, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
762 |
stfd(F25, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
763 |
stfd(F26, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
764 |
stfd(F27, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
765 |
stfd(F28, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
766 |
stfd(F29, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
767 |
stfd(F30, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
768 |
stfd(F31, offset, dst); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
769 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
770 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
771 |
// Uses ordering which corresponds to ABI: |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
772 |
// _restgpr0_14: ld r14,-144(r1) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
773 |
// _restgpr0_15: ld r15,-136(r1) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
774 |
// _restgpr0_16: ld r16,-128(r1) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
775 |
void MacroAssembler::restore_nonvolatile_gprs(Register src, int offset) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
776 |
ld(R14, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
777 |
ld(R15, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
778 |
ld(R16, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
779 |
ld(R17, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
780 |
ld(R18, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
781 |
ld(R19, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
782 |
ld(R20, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
783 |
ld(R21, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
784 |
ld(R22, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
785 |
ld(R23, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
786 |
ld(R24, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
787 |
ld(R25, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
788 |
ld(R26, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
789 |
ld(R27, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
790 |
ld(R28, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
791 |
ld(R29, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
792 |
ld(R30, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
793 |
ld(R31, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
794 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
795 |
// FP registers |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
796 |
lfd(F14, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
797 |
lfd(F15, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
798 |
lfd(F16, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
799 |
lfd(F17, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
800 |
lfd(F18, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
801 |
lfd(F19, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
802 |
lfd(F20, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
803 |
lfd(F21, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
804 |
lfd(F22, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
805 |
lfd(F23, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
806 |
lfd(F24, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
807 |
lfd(F25, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
808 |
lfd(F26, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
809 |
lfd(F27, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
810 |
lfd(F28, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
811 |
lfd(F29, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
812 |
lfd(F30, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
813 |
lfd(F31, offset, src); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
814 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
815 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
816 |
// For verify_oops. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
817 |
void MacroAssembler::save_volatile_gprs(Register dst, int offset) { |
28187
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
818 |
std(R2, offset, dst); offset += 8; |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
819 |
std(R3, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
820 |
std(R4, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
821 |
std(R5, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
822 |
std(R6, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
823 |
std(R7, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
824 |
std(R8, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
825 |
std(R9, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
826 |
std(R10, offset, dst); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
827 |
std(R11, offset, dst); offset += 8; |
35085 | 828 |
std(R12, offset, dst); offset += 8; |
829 |
||
830 |
stfd(F0, offset, dst); offset += 8; |
|
831 |
stfd(F1, offset, dst); offset += 8; |
|
832 |
stfd(F2, offset, dst); offset += 8; |
|
833 |
stfd(F3, offset, dst); offset += 8; |
|
834 |
stfd(F4, offset, dst); offset += 8; |
|
835 |
stfd(F5, offset, dst); offset += 8; |
|
836 |
stfd(F6, offset, dst); offset += 8; |
|
837 |
stfd(F7, offset, dst); offset += 8; |
|
838 |
stfd(F8, offset, dst); offset += 8; |
|
839 |
stfd(F9, offset, dst); offset += 8; |
|
840 |
stfd(F10, offset, dst); offset += 8; |
|
841 |
stfd(F11, offset, dst); offset += 8; |
|
842 |
stfd(F12, offset, dst); offset += 8; |
|
843 |
stfd(F13, offset, dst); |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
844 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
845 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
846 |
// For verify_oops. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
847 |
void MacroAssembler::restore_volatile_gprs(Register src, int offset) { |
28187
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
848 |
ld(R2, offset, src); offset += 8; |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
849 |
ld(R3, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
850 |
ld(R4, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
851 |
ld(R5, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
852 |
ld(R6, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
853 |
ld(R7, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
854 |
ld(R8, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
855 |
ld(R9, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
856 |
ld(R10, offset, src); offset += 8; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
857 |
ld(R11, offset, src); offset += 8; |
35085 | 858 |
ld(R12, offset, src); offset += 8; |
859 |
||
860 |
lfd(F0, offset, src); offset += 8; |
|
861 |
lfd(F1, offset, src); offset += 8; |
|
862 |
lfd(F2, offset, src); offset += 8; |
|
863 |
lfd(F3, offset, src); offset += 8; |
|
864 |
lfd(F4, offset, src); offset += 8; |
|
865 |
lfd(F5, offset, src); offset += 8; |
|
866 |
lfd(F6, offset, src); offset += 8; |
|
867 |
lfd(F7, offset, src); offset += 8; |
|
868 |
lfd(F8, offset, src); offset += 8; |
|
869 |
lfd(F9, offset, src); offset += 8; |
|
870 |
lfd(F10, offset, src); offset += 8; |
|
871 |
lfd(F11, offset, src); offset += 8; |
|
872 |
lfd(F12, offset, src); offset += 8; |
|
873 |
lfd(F13, offset, src); |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
874 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
875 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
876 |
// Save CR and LR into the cr and lr slots of the ABI area addressed via R1_SP,
// using 'tmp' as the transfer register.
// CR is handled first so that LR is the last value moved into 'tmp'.
void MacroAssembler::save_LR_CR(Register tmp) {
  // CR -> tmp -> abi.cr
  mfcr(tmp);
  std(tmp, _abi(cr), R1_SP);

  // LR -> tmp -> abi.lr
  mflr(tmp);
  std(tmp, _abi(lr), R1_SP);
  // Tmp must contain lr on exit! (see return_addr and prolog in ppc64.ad)
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
883 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
884 |
// Reload LR and CR from the lr and cr slots of the ABI area addressed via
// R1_SP, using 'tmp' as the transfer register. 'tmp' must not be R1_SP,
// since it is overwritten while R1_SP is still needed as the base.
void MacroAssembler::restore_LR_CR(Register tmp) {
  assert(tmp != R1_SP, "must be distinct");

  // abi.lr -> tmp -> LR
  ld(tmp, _abi(lr), R1_SP);
  mtlr(tmp);

  // abi.cr -> tmp -> CR
  ld(tmp, _abi(cr), R1_SP);
  mtcr(tmp);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
891 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
892 |
// Emit code that materializes a PC value in 'result' by branching-and-linking
// to the immediately following instruction and then reading LR. LR is
// overwritten as a side effect (hence "trash_LR").
// Returns the assembler's pc() at the bound label, i.e. the position of the
// emitted mflr.
address MacroAssembler::get_PC_trash_LR(Register result) {
  Label next_insn;
  bl(next_insn);
  bind(next_insn);
  address pc_at_label = pc();
  mflr(result);
  return pc_at_label;
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
900 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
901 |
// Resize the current frame by the amount held in register 'offset'.
// 'tmp' is clobbered. In ASSERT builds the registers are checked to be
// distinct and a runtime check is emitted that 'offset' is a multiple of
// frame::alignment_in_bytes.
void MacroAssembler::resize_frame(Register offset, Register tmp) {
#ifdef ASSERT
  assert_different_registers(offset, tmp, R1_SP);
  // The low alignment bits of offset must all be zero.
  andi_(tmp, offset, frame::alignment_in_bytes-1);
  asm_assert_eq("resize_frame: unaligned", 0x204);
#endif

  // Fetch the caller's SP stored in the current frame:
  //   tmp <- *(SP)
  ld(tmp, _abi(callers_sp), R1_SP);

  // Store it at the new frame address and update SP in a single instruction:
  //   addr <- SP + offset;
  //   *(addr) <- tmp;
  //   SP <- addr
  stdux(tmp, R1_SP, offset);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
915 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
916 |
void MacroAssembler::resize_frame(int offset, Register tmp) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
917 |
assert(is_simm(offset, 16), "too big an offset"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
918 |
assert_different_registers(tmp, R1_SP); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
919 |
assert((offset & (frame::alignment_in_bytes-1))==0, "resize_frame: unaligned"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
920 |
// tmp <- *(SP) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
921 |
ld(tmp, _abi(callers_sp), R1_SP); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
922 |
// addr <- SP + offset; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
923 |
// *(addr) <- tmp; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
924 |
// SP <- addr |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
925 |
stdu(tmp, offset, R1_SP); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
926 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
927 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
928 |
// Resize the current frame so that SP ends up at the absolute address `addr`.
// `addr` may alias `tmp1` or `tmp2`; `tmp1` and `tmp2` must differ from each
// other. Both temporaries are overwritten.
void MacroAssembler::resize_frame_absolute(Register addr, Register tmp1, Register tmp2) {
  assert(tmp1 != tmp2, "must be distinct");

  const Register sp_delta = tmp1;  // receives addr - SP
  const Register scratch  = tmp2;  // temp for the register-offset resize_frame

  // Offset relative to the current stack pointer: sp_delta <- addr - SP (!)
  subf(sp_delta, R1_SP, addr);

  // Update SP and keep the back link via the register-offset variant.
  resize_frame(sp_delta, scratch);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
939 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
940 |
// Push a frame whose size in bytes is held in register `bytes`.
// `tmp` receives the negated size; `bytes` must not be R0.
void MacroAssembler::push_frame(Register bytes, Register tmp) {
#ifdef ASSERT
  // Debug builds only: reject R0 and check that the size is frame-aligned.
  // R0 is used as scratch for the masked value.
  const int alignment_mask = frame::alignment_in_bytes - 1;
  assert(bytes != R0, "r0 not allowed here");
  andi_(R0, bytes, alignment_mask);
  asm_assert_eq("push_frame(Reg, Reg): unaligned", 0x203);
#endif

  // tmp <- -bytes, then store the old SP at SP + tmp and update SP.
  neg(tmp, bytes);
  stdux(R1_SP, R1_SP, tmp);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
949 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
950 |
// Push a frame of size `bytes'. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
951 |
void MacroAssembler::push_frame(unsigned int bytes, Register tmp) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
952 |
long offset = align_addr(bytes, frame::alignment_in_bytes); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
953 |
if (is_simm(-offset, 16)) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
954 |
stdu(R1_SP, -offset, R1_SP); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
955 |
} else { |
35085 | 956 |
load_const_optimized(tmp, -offset); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
957 |
stdux(R1_SP, R1_SP, tmp); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
958 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
959 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
960 |
|
23211 | 961 |
// Push a frame of size `bytes' plus abi_reg_args on top. |
962 |
void MacroAssembler::push_frame_reg_args(unsigned int bytes, Register tmp) { |
|
963 |
push_frame(bytes + frame::abi_reg_args_size, tmp); |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
964 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
965 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
966 |
// Setup up a new C frame with a spill area for non-volatile GPRs and |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
967 |
// additional space for local variables. |
23211 | 968 |
void MacroAssembler::push_frame_reg_args_nonvolatiles(unsigned int bytes, |
969 |
Register tmp) { |
|
970 |
push_frame(bytes + frame::abi_reg_args_size + frame::spill_nonvolatiles_size, tmp); |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
971 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
972 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
973 |
// Pop current C frame. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
974 |
void MacroAssembler::pop_frame() { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
975 |
ld(R1_SP, _abi(callers_sp), R1_SP); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
976 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
977 |
|
23211 | 978 |
#if defined(ABI_ELFv2) |
979 |
// ABI_ELFv2 variant: branch (optionally with link) to the entry point held
// in `r_function_entry`. The entry is moved into R12 if it is not already
// there. Updates and returns _last_calls_return_pc.
address MacroAssembler::branch_to(Register r_function_entry, bool and_link) {
  // TODO(asmundak): make sure the caller uses R12 as function descriptor
  // most of the times.
  const bool entry_in_r12 = (R12 == r_function_entry);
  if (!entry_in_r12) {
    mr(R12, r_function_entry);
  }
  mtctr(R12);

  // Call (link) or plain branch through CTR.
  if (and_link) {
    bctrl();
  } else {
    bctr();
  }

  // Record the pc right behind the branch instruction.
  const address return_pc = pc();
  _last_calls_return_pc = return_pc;
  return return_pc;
}
|
996 |
||
997 |
// Call a C function via a function descriptor and use full C |
|
998 |
// calling conventions. Updates and returns _last_calls_return_pc. |
|
999 |
address MacroAssembler::call_c(Register r_function_entry) { |
|
1000 |
return branch_to(r_function_entry, /*and_link=*/true); |
|
1001 |
} |
|
1002 |
||
1003 |
// For tail calls: only branch, don't link, so callee returns to caller of this function. |
|
1004 |
address MacroAssembler::call_c_and_return_to_caller(Register r_function_entry) { |
|
1005 |
return branch_to(r_function_entry, /*and_link=*/false); |
|
1006 |
} |
|
1007 |
||
1008 |
// Call the C function at the constant address `function_entry`: the address
// is loaded into R12 (R0 is passed to load_const as temp) and then called
// with link. `rt` is not referenced in this variant.
address MacroAssembler::call_c(address function_entry, relocInfo::relocType rt) {
  const bool link = true;
  load_const(R12, function_entry, R0);
  return branch_to(R12, link);
}
|
1012 |
||
1013 |
#else |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1014 |
// Generic version of a call to C function via a function descriptor |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1015 |
// with variable support for C calling conventions (TOC, ENV, etc.). |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1016 |
// Updates and returns _last_calls_return_pc. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1017 |
address MacroAssembler::branch_to(Register function_descriptor, bool and_link, bool save_toc_before_call, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1018 |
bool restore_toc_after_call, bool load_toc_of_callee, bool load_env_of_callee) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1019 |
// we emit standard ptrgl glue code here |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1020 |
assert((function_descriptor != R0), "function_descriptor cannot be R0"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1021 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1022 |
// retrieve necessary entries from the function descriptor |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1023 |
ld(R0, in_bytes(FunctionDescriptor::entry_offset()), function_descriptor); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1024 |
mtctr(R0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1025 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1026 |
if (load_toc_of_callee) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1027 |
ld(R2_TOC, in_bytes(FunctionDescriptor::toc_offset()), function_descriptor); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1028 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1029 |
if (load_env_of_callee) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1030 |
ld(R11, in_bytes(FunctionDescriptor::env_offset()), function_descriptor); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1031 |
} else if (load_toc_of_callee) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1032 |
li(R11, 0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1033 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1034 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1035 |
// do a call or a branch |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1036 |
if (and_link) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1037 |
bctrl(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1038 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1039 |
bctr(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1040 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1041 |
_last_calls_return_pc = pc(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1042 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1043 |
return _last_calls_return_pc; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1044 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1045 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1046 |
// Call a C function via a function descriptor and use full C calling |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1047 |
// conventions. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1048 |
// We don't use the TOC in generated code, so there is no need to save |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1049 |
// and restore its value. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1050 |
address MacroAssembler::call_c(Register fd) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1051 |
return branch_to(fd, /*and_link=*/true, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1052 |
/*save toc=*/false, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1053 |
/*restore toc=*/false, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1054 |
/*load toc=*/true, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1055 |
/*load env=*/true); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1056 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1057 |
|
22861 | 1058 |
// Branch (no link) to the C function described by the descriptor in
// register `fd`, loading the callee's TOC and env. The TOC is neither saved
// nor restored.
address MacroAssembler::call_c_and_return_to_caller(Register fd) {
  const bool link        = false;
  const bool save_toc    = false;
  const bool restore_toc = false;
  const bool load_toc    = true;
  const bool load_env    = true;
  return branch_to(fd, link, save_toc, restore_toc, load_toc, load_env);
}
|
1065 |
||
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1066 |
// Call the C function described by the constant descriptor `fd`.
//
// rt != relocInfo::none: the call must be relocatable. A "friend" function
//   (as defined by class FunctionDescriptor) is called via bl64_patchable,
//   padded with nops to the code size of the full sequence; everything else
//   gets a full descriptor call through R11. fd == NULL is accepted on this
//   path to support code-size estimation.
// rt == relocInfo::none: no relocation needed, so a friend function may be
//   reached with a plain bl when it is within branch range.
//
// Updates and returns _last_calls_return_pc.
address MacroAssembler::call_c(const FunctionDescriptor* fd, relocInfo::relocType rt) {
  const bool relocatable = (rt != relocInfo::none);

  if (relocatable) {
    // Evaluation order matters: fd is only dereferenced after the NULL test.
    const bool needs_full_call =
        !ReoptimizeCallSequences
        || (rt != relocInfo::runtime_call_type && rt != relocInfo::none)
        || fd == NULL   // support code-size estimation
        || !fd->is_friend_function()
        || fd->entry() == NULL;

    if (!needs_full_call) {
      // Friend function: load the entry point and don't care about toc and
      // env. Use an optimizable call instruction, but ensure the same
      // code-size as in the case of a non-friend function.
      nop();
      nop();
      nop();
      bl64_patchable(fd->entry(), rt);
      _last_calls_return_pc = pc();
      return _last_calls_return_pc;
    }

    // Not a friend function as defined by class FunctionDescriptor:
    // do a full call-c via the descriptor address in R11.
    load_const(R11, (address)fd, R0);

    const bool has_env = (fd != NULL && fd->env() != NULL);
    return branch_to(R11, /*and_link=*/true,
                          /*save toc=*/false,
                          /*restore toc=*/false,
                          /*load toc=*/true,
                          /*load env=*/has_env);
  }

  // Non-relocatable call: more aggressive optimizations are possible.
  if (!ReoptimizeCallSequences || !fd->is_friend_function()) {
    // Not a friend function: full call-c via the descriptor address in R11.
    load_const(R11, (address)fd, R0);
    return branch_to(R11, /*and_link=*/true,
                          /*save toc=*/false,
                          /*restore toc=*/false,
                          /*load toc=*/true,
                          /*load env=*/true);
  }

  // Friend function: branch to the entry point, ignoring toc and env.
  address target = fd->entry();
  if (is_within_range_of_b(target, pc())) {
    bl(target);
  } else {
    bl64_patchable(target, rt);
  }
  _last_calls_return_pc = pc();
  return _last_calls_return_pc;
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1122 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1123 |
// Call a C function. All constants needed reside in TOC. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1124 |
// |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1125 |
// Read the address to call from the TOC. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1126 |
// Read env from TOC, if fd specifies an env. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1127 |
// Read new TOC from TOC. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1128 |
address MacroAssembler::call_c_using_toc(const FunctionDescriptor* fd, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1129 |
relocInfo::relocType rt, Register toc) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1130 |
if (!ReoptimizeCallSequences |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1131 |
|| (rt != relocInfo::runtime_call_type && rt != relocInfo::none) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1132 |
|| !fd->is_friend_function()) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1133 |
// It's not a friend function as defined by class FunctionDescriptor, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1134 |
// so do a full call-c here. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1135 |
assert(fd->entry() != NULL, "function must be linked"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1136 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1137 |
AddressLiteral fd_entry(fd->entry()); |
35085 | 1138 |
bool success = load_const_from_method_toc(R11, fd_entry, toc, /*fixed_size*/ true); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1139 |
mtctr(R11); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1140 |
if (fd->env() == NULL) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1141 |
li(R11, 0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1142 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1143 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1144 |
AddressLiteral fd_env(fd->env()); |
35085 | 1145 |
success = success && load_const_from_method_toc(R11, fd_env, toc, /*fixed_size*/ true); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1146 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1147 |
AddressLiteral fd_toc(fd->toc()); |
35085 | 1148 |
// Set R2_TOC (load from toc) |
1149 |
success = success && load_const_from_method_toc(R2_TOC, fd_toc, toc, /*fixed_size*/ true); |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1150 |
bctrl(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1151 |
_last_calls_return_pc = pc(); |
35085 | 1152 |
if (!success) { return NULL; } |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1153 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1154 |
// It's a friend function, load the entry point and don't care about |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1155 |
// toc and env. Use an optimizable call instruction, but ensure the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1156 |
// same code-size as in the case of a non-friend function. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1157 |
nop(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1158 |
bl64_patchable(fd->entry(), rt); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1159 |
_last_calls_return_pc = pc(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1160 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1161 |
return _last_calls_return_pc; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1162 |
} |
23492 | 1163 |
#endif // ABI_ELFv2 |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1164 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1165 |
void MacroAssembler::call_VM_base(Register oop_result, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1166 |
Register last_java_sp, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1167 |
address entry_point, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1168 |
bool check_exceptions) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1169 |
BLOCK_COMMENT("call_VM {"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1170 |
// Determine last_java_sp register. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1171 |
if (!last_java_sp->is_valid()) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1172 |
last_java_sp = R1_SP; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1173 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1174 |
set_top_ijava_frame_at_SP_as_last_Java_frame(last_java_sp, R11_scratch1); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1175 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1176 |
// ARG1 must hold thread address. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1177 |
mr(R3_ARG1, R16_thread); |
23211 | 1178 |
#if defined(ABI_ELFv2) |
1179 |
address return_pc = call_c(entry_point, relocInfo::none); |
|
1180 |
#else |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1181 |
address return_pc = call_c((FunctionDescriptor*)entry_point, relocInfo::none); |
23211 | 1182 |
#endif |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1183 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1184 |
reset_last_Java_frame(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1185 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1186 |
// Check for pending exceptions. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1187 |
if (check_exceptions) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1188 |
// We don't check for exceptions here. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1189 |
ShouldNotReachHere(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1190 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1191 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1192 |
// Get oop result if there is one and reset the value in the thread. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1193 |
if (oop_result->is_valid()) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1194 |
get_vm_result(oop_result); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1195 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1196 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1197 |
_last_calls_return_pc = return_pc; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1198 |
BLOCK_COMMENT("} call_VM"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1199 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1200 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1201 |
// Common code for all call_VM_leaf variants: emits a plain C call to
// entry_point, bracketed by block comments. No frame bookkeeping is done here.
void MacroAssembler::call_VM_leaf_base(address entry_point) {
  BLOCK_COMMENT("call_VM_leaf {");
#if !defined(ABI_ELFv2)
  // Without ELFv2 the entry point is handed to call_c as a function descriptor.
  call_c(CAST_FROM_FN_PTR(FunctionDescriptor*, entry_point), relocInfo::none);
#else
  call_c(entry_point, relocInfo::none);
#endif
  BLOCK_COMMENT("} call_VM_leaf");
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1210 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1211 |
// call_VM without extra arguments: delegates to call_VM_base, passing noreg
// as last_java_sp.
void MacroAssembler::call_VM(Register oop_result, address entry_point, bool check_exceptions) {
  const Register no_explicit_sp = noreg;
  call_VM_base(oop_result, no_explicit_sp, entry_point, check_exceptions);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1214 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1215 |
void MacroAssembler::call_VM(Register oop_result, address entry_point, Register arg_1, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1216 |
bool check_exceptions) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1217 |
// R3_ARG1 is reserved for the thread. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1218 |
mr_if_needed(R4_ARG2, arg_1); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1219 |
call_VM(oop_result, entry_point, check_exceptions); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1220 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1221 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1222 |
void MacroAssembler::call_VM(Register oop_result, address entry_point, Register arg_1, Register arg_2, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1223 |
bool check_exceptions) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1224 |
// R3_ARG1 is reserved for the thread |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1225 |
mr_if_needed(R4_ARG2, arg_1); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1226 |
assert(arg_2 != R4_ARG2, "smashed argument"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1227 |
mr_if_needed(R5_ARG3, arg_2); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1228 |
call_VM(oop_result, entry_point, check_exceptions); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1229 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1230 |
|
28187
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
1231 |
void MacroAssembler::call_VM(Register oop_result, address entry_point, Register arg_1, Register arg_2, Register arg_3, |
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
1232 |
bool check_exceptions) { |
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
1233 |
// R3_ARG1 is reserved for the thread |
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
1234 |
mr_if_needed(R4_ARG2, arg_1); |
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
1235 |
assert(arg_2 != R4_ARG2, "smashed argument"); |
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
1236 |
mr_if_needed(R5_ARG3, arg_2); |
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
1237 |
mr_if_needed(R6_ARG4, arg_3); |
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
1238 |
call_VM(oop_result, entry_point, check_exceptions); |
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
1239 |
} |
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
1240 |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1241 |
// call_VM_leaf without arguments: forwards straight to call_VM_leaf_base.
void MacroAssembler::call_VM_leaf(address entry_point) {
  address leaf_entry = entry_point;
  call_VM_leaf_base(leaf_entry);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1244 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1245 |
// call_VM_leaf with one argument: arg_1 is placed in R3_ARG1, then the
// argument-less call_VM_leaf is used.
void MacroAssembler::call_VM_leaf(address entry_point, Register arg_1) {
  mr_if_needed(R3_ARG1, arg_1);  // first argument -> ARG1
  call_VM_leaf(entry_point);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1249 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1250 |
// call_VM_leaf with two arguments: arg_1 and arg_2 are placed in R3_ARG1 and
// R4_ARG2, then the argument-less call_VM_leaf is used.
void MacroAssembler::call_VM_leaf(address entry_point, Register arg_1, Register arg_2) {
  mr_if_needed(R3_ARG1, arg_1);  // first argument -> ARG1

  // arg_2 must not live in R3_ARG1, which was the target of the move above.
  assert(arg_2 != R3_ARG1, "smashed argument");
  mr_if_needed(R4_ARG2, arg_2);  // second argument -> ARG2

  call_VM_leaf(entry_point);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1256 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1257 |
// call_VM_leaf with three arguments: arg_1, arg_2 and arg_3 are placed in
// R3_ARG1, R4_ARG2 and R5_ARG3, then the argument-less call_VM_leaf is used.
// Each later argument must not live in a register targeted by an earlier move.
void MacroAssembler::call_VM_leaf(address entry_point, Register arg_1, Register arg_2, Register arg_3) {
  mr_if_needed(R3_ARG1, arg_1);  // first argument -> ARG1

  assert(arg_2 != R3_ARG1, "smashed argument");
  mr_if_needed(R4_ARG2, arg_2);  // second argument -> ARG2

  assert(arg_3 != R3_ARG1 && arg_3 != R4_ARG2, "smashed argument");
  mr_if_needed(R5_ARG3, arg_3);  // third argument -> ARG3

  call_VM_leaf(entry_point);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1265 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1266 |
// Check whether instruction is a read access to the polling page |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1267 |
// which was emitted by load_from_polling_page(..). |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1268 |
bool MacroAssembler::is_load_from_polling_page(int instruction, void* ucontext, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1269 |
address* polling_address_ptr) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1270 |
if (!is_ld(instruction)) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1271 |
return false; // It's not a ld. Fail. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1272 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1273 |
int rt = inv_rt_field(instruction); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1274 |
int ra = inv_ra_field(instruction); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1275 |
int ds = inv_ds_field(instruction); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1276 |
if (!(ds == 0 && ra != 0 && rt == 0)) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1277 |
return false; // It's not a ld(r0, X, ra). Fail. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1278 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1279 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1280 |
if (!ucontext) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1281 |
// Set polling address. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1282 |
if (polling_address_ptr != NULL) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1283 |
*polling_address_ptr = NULL; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1284 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1285 |
return true; // No ucontext given. Can't check value of ra. Assume true. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1286 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1287 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1288 |
#ifdef LINUX |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1289 |
// Ucontext given. Check that register ra contains the address of |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1290 |
// the safepoing polling page. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1291 |
ucontext_t* uc = (ucontext_t*) ucontext; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1292 |
// Set polling address. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1293 |
address addr = (address)uc->uc_mcontext.regs->gpr[ra] + (ssize_t)ds; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1294 |
if (polling_address_ptr != NULL) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1295 |
*polling_address_ptr = addr; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1296 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1297 |
return os::is_poll_address(addr); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1298 |
#else |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1299 |
// Not on Linux, ucontext must be NULL. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1300 |
ShouldNotReachHere(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1301 |
return false; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1302 |
#endif |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1303 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1304 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1305 |
bool MacroAssembler::is_memory_serialization(int instruction, JavaThread* thread, void* ucontext) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1306 |
#ifdef LINUX |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1307 |
ucontext_t* uc = (ucontext_t*) ucontext; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1308 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1309 |
if (is_stwx(instruction) || is_stwux(instruction)) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1310 |
int ra = inv_ra_field(instruction); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1311 |
int rb = inv_rb_field(instruction); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1312 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1313 |
// look up content of ra and rb in ucontext |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1314 |
address ra_val=(address)uc->uc_mcontext.regs->gpr[ra]; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1315 |
long rb_val=(long)uc->uc_mcontext.regs->gpr[rb]; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1316 |
return os::is_memory_serialize_page(thread, ra_val+rb_val); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1317 |
} else if (is_stw(instruction) || is_stwu(instruction)) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1318 |
int ra = inv_ra_field(instruction); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1319 |
int d1 = inv_d1_field(instruction); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1320 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1321 |
// look up content of ra in ucontext |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1322 |
address ra_val=(address)uc->uc_mcontext.regs->gpr[ra]; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1323 |
return os::is_memory_serialize_page(thread, ra_val+d1); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1324 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1325 |
return false; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1326 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1327 |
#else |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1328 |
// workaround not needed on !LINUX :-) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1329 |
ShouldNotCallThis(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1330 |
return false; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1331 |
#endif |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1332 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1333 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1334 |
void MacroAssembler::bang_stack_with_offset(int offset) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1335 |
// When increasing the stack, the old stack pointer will be written |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1336 |
// to the new top of stack according to the PPC64 abi. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1337 |
// Therefore, stack banging is not necessary when increasing |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1338 |
// the stack by <= os::vm_page_size() bytes. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1339 |
// When increasing the stack by a larger amount, this method is |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1340 |
// called repeatedly to bang the intermediate pages. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1341 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1342 |
// Stack grows down, caller passes positive offset. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1343 |
assert(offset > 0, "must bang with positive offset"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1344 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1345 |
long stdoffset = -offset; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1346 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1347 |
if (is_simm(stdoffset, 16)) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1348 |
// Signed 16 bit offset, a simple std is ok. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1349 |
if (UseLoadInstructionsForStackBangingPPC64) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1350 |
ld(R0, (int)(signed short)stdoffset, R1_SP); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1351 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1352 |
std(R0,(int)(signed short)stdoffset, R1_SP); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1353 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1354 |
} else if (is_simm(stdoffset, 31)) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1355 |
const int hi = MacroAssembler::largeoffset_si16_si16_hi(stdoffset); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1356 |
const int lo = MacroAssembler::largeoffset_si16_si16_lo(stdoffset); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1357 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1358 |
Register tmp = R11; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1359 |
addis(tmp, R1_SP, hi); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1360 |
if (UseLoadInstructionsForStackBangingPPC64) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1361 |
ld(R0, lo, tmp); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1362 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1363 |
std(R0, lo, tmp); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1364 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1365 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1366 |
ShouldNotReachHere(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1367 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1368 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1369 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1370 |
// If instruction is a stack bang of the form |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1371 |
// std R0, x(Ry), (see bang_stack_with_offset()) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1372 |
// stdu R1_SP, x(R1_SP), (see push_frame(), resize_frame()) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1373 |
// or stdux R1_SP, Rx, R1_SP (see push_frame(), resize_frame()) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1374 |
// return the banged address. Otherwise, return 0. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1375 |
// Inspects 'instruction' and, if it matches one of the stack banging forms
// recognized below, returns the address it accesses, computed from the
// register values saved in 'ucontext'. Returns NULL if the instruction is
// not a stack bang. Must only be called on LINUX.
address MacroAssembler::get_stack_bang_address(int instruction, void *ucontext) {
#ifdef LINUX
  ucontext_t* const context = (ucontext_t*) ucontext;
  const int rs = inv_rs_field(instruction);
  const int ra = inv_ra_field(instruction);

  // Displacement forms: ld/std with rs field 0 (which of the two is expected
  // depends on UseLoadInstructionsForStackBangingPPC64), or stdu with rs field 1.
  const bool bang_with_displacement =
         (is_ld(instruction)   && rs == 0 &&  UseLoadInstructionsForStackBangingPPC64)
      || (is_std(instruction)  && rs == 0 && !UseLoadInstructionsForStackBangingPPC64)
      || (is_stdu(instruction) && rs == 1);
  if (bang_with_displacement) {
    const int displacement = inv_ds_field(instruction);
    // Banged address: saved value of register ra plus the displacement.
    return displacement + (address)context->uc_mcontext.regs->gpr[ra];
  }

  // Indexed form: stdux with rs field 1.
  if (!(is_stdux(instruction) && rs == 1)) {
    return NULL; // not a stack bang
  }

  const int rb = inv_rb_field(instruction);
  address stack_pointer = (address)context->uc_mcontext.regs->gpr[1];
  const long index = (long)context->uc_mcontext.regs->gpr[rb];
  if (ra == 1 && index < 0) {
    return stack_pointer + index; // banged address
  }
  return NULL; // not a stack bang
#else
  // workaround not needed on !LINUX :-)
  ShouldNotCallThis();
  return NULL;
#endif
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1400 |
|
38931
3cf28d630349
8156923: [ppc] Implement "JEP 270: Reserved Stack Areas for Critical Sections".
goetz
parents:
38685
diff
changeset
|
1401 |
// Emits the reserved stack zone check.
// The generated code loads the thread's reserved_stack_activation value and
// compares R1_SP against it (unsigned). If SP is below that value, nothing
// else happens. Otherwise the code calls
// SharedRuntime::enable_stack_reserved_zone, puts 'return_pc' into LR and
// jumps to the delayed StackOverflowError stub. Uses R0 and CCR0.
void MacroAssembler::reserved_stack_check(Register return_pc) {
  const address enable_zone_entry =
      CAST_FROM_FN_PTR(address, SharedRuntime::enable_stack_reserved_zone);
  const address throw_soe_entry =
      StubRoutines::throw_delayed_StackOverflowError_entry();
  Label zone_check_done;

  // Does the reserved zone need to be enabled?
  ld_ptr(R0, JavaThread::reserved_stack_activation_offset(), R16_thread);
  cmpld(CCR0, R1_SP, R0);
  blt_predict_taken(CCR0, zone_check_done);

  // Re-enable the reserved zone ...
  push_frame_reg_args(0, R0);
  call_VM_leaf(enable_zone_entry, R16_thread);
  pop_frame();

  // ... and throw the stack overflow exception.
  mtlr(return_pc);
  load_const_optimized(R0, throw_soe_entry);
  mtctr(R0);
  bctr();

  should_not_reach_here();

  bind(zone_check_done);
}
3cf28d630349
8156923: [ppc] Implement "JEP 270: Reserved Stack Areas for Critical Sections".
goetz
parents:
38685
diff
changeset
|
1422 |
|
39444
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1423 |
void MacroAssembler::getandsetd(Register dest_current_value, Register exchange_value, Register addr_base, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1424 |
bool cmpxchgx_hint) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1425 |
Label retry; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1426 |
bind(retry); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1427 |
ldarx(dest_current_value, addr_base, cmpxchgx_hint); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1428 |
stdcx_(exchange_value, addr_base); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1429 |
if (UseStaticBranchPredictionInCompareAndSwapPPC64) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1430 |
bne_predict_not_taken(CCR0, retry); // StXcx_ sets CCR0. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1431 |
} else { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1432 |
bne( CCR0, retry); // StXcx_ sets CCR0. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1433 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1434 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1435 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1436 |
// Emits a ldarx/add/stdcx_ loop on the doubleword at addr_base:
// dest_current_value receives the loaded value, tmp receives
// dest_current_value + inc_value and is stored conditionally. The loop is
// repeated until the conditional store succeeds. Kills tmp; CCR0 is set by
// stdcx_.
void MacroAssembler::getandaddd(Register dest_current_value, Register inc_value, Register addr_base,
                                Register tmp, bool cmpxchgx_hint) {
  Label again;

  bind(again);
  ldarx(dest_current_value, addr_base, cmpxchgx_hint);
  add(tmp, dest_current_value, inc_value);
  stdcx_(tmp, addr_base);

  // StXcx_ sets CCR0; 'ne' means the store did not succeed.
  if (!UseStaticBranchPredictionInCompareAndSwapPPC64) {
    bne(CCR0, again);
  } else {
    bne_predict_not_taken(CCR0, again);
  }
}
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1449 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1450 |
// Word/sub-word atomic helper functions |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1451 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1452 |
// Temps and addr_base are killed if size < 4 and processor does not support respective instructions. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1453 |
// Only signed types are supported with size < 4. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1454 |
// Atomic add always kills tmp1. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1455 |
void MacroAssembler::atomic_get_and_modify_generic(Register dest_current_value, Register exchange_value, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1456 |
Register addr_base, Register tmp1, Register tmp2, Register tmp3, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1457 |
bool cmpxchgx_hint, bool is_add, int size) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1458 |
// Sub-word instructions are available since Power 8. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1459 |
// For older processors, instruction_type != size holds, and we |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1460 |
// emulate the sub-word instructions by constructing a 4-byte value |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1461 |
// that leaves the other bytes unchanged. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1462 |
const int instruction_type = VM_Version::has_lqarx() ? size : 4; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1463 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1464 |
Label retry; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1465 |
Register shift_amount = noreg, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1466 |
val32 = dest_current_value, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1467 |
modval = is_add ? tmp1 : exchange_value; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1468 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1469 |
if (instruction_type != size) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1470 |
assert_different_registers(tmp1, tmp2, tmp3, dest_current_value, exchange_value, addr_base); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1471 |
modval = tmp1; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1472 |
shift_amount = tmp2; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1473 |
val32 = tmp3; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1474 |
// Need some preperation: Compute shift amount, align address. Note: shorts must be 2 byte aligned. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1475 |
#ifdef VM_LITTLE_ENDIAN |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1476 |
rldic(shift_amount, addr_base, 3, 64-5); // (dest & 3) * 8; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1477 |
clrrdi(addr_base, addr_base, 2); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1478 |
#else |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1479 |
xori(shift_amount, addr_base, (size == 1) ? 3 : 2); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1480 |
clrrdi(addr_base, addr_base, 2); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1481 |
rldic(shift_amount, shift_amount, 3, 64-5); // byte: ((3-dest) & 3) * 8; short: ((1-dest/2) & 1) * 16; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1482 |
#endif |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1483 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1484 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1485 |
// atomic emulation loop |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1486 |
bind(retry); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1487 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1488 |
switch (instruction_type) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1489 |
case 4: lwarx(val32, addr_base, cmpxchgx_hint); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1490 |
case 2: lharx(val32, addr_base, cmpxchgx_hint); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1491 |
case 1: lbarx(val32, addr_base, cmpxchgx_hint); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1492 |
default: ShouldNotReachHere(); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1493 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1494 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1495 |
if (instruction_type != size) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1496 |
srw(dest_current_value, val32, shift_amount); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1497 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1498 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1499 |
if (is_add) { add(modval, dest_current_value, exchange_value); } |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1500 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1501 |
if (instruction_type != size) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1502 |
// Transform exchange value such that the replacement can be done by one xor instruction. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1503 |
xorr(modval, dest_current_value, is_add ? modval : exchange_value); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1504 |
clrldi(modval, modval, (size == 1) ? 56 : 48); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1505 |
slw(modval, modval, shift_amount); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1506 |
xorr(modval, val32, modval); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1507 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1508 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1509 |
switch (instruction_type) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1510 |
case 4: stwcx_(modval, addr_base); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1511 |
case 2: sthcx_(modval, addr_base); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1512 |
case 1: stbcx_(modval, addr_base); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1513 |
default: ShouldNotReachHere(); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1514 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1515 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1516 |
if (UseStaticBranchPredictionInCompareAndSwapPPC64) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1517 |
bne_predict_not_taken(CCR0, retry); // StXcx_ sets CCR0. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1518 |
} else { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1519 |
bne( CCR0, retry); // StXcx_ sets CCR0. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1520 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1521 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1522 |
// l?arx zero-extends, but Java wants byte/short values sign-extended. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1523 |
if (size == 1) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1524 |
extsb(dest_current_value, dest_current_value); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1525 |
} else if (size == 2) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1526 |
extsh(dest_current_value, dest_current_value); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1527 |
}; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1528 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1529 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1530 |
// Temps, addr_base and exchange_value are killed if size < 4 and processor does not support respective instructions. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1531 |
// Only signed types are supported with size < 4. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1532 |
void MacroAssembler::cmpxchg_loop_body(ConditionRegister flag, Register dest_current_value, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1533 |
Register compare_value, Register exchange_value, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1534 |
Register addr_base, Register tmp1, Register tmp2, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1535 |
Label &retry, Label &failed, bool cmpxchgx_hint, int size) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1536 |
// Sub-word instructions are available since Power 8. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1537 |
// For older processors, instruction_type != size holds, and we |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1538 |
// emulate the sub-word instructions by constructing a 4-byte value |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1539 |
// that leaves the other bytes unchanged. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1540 |
const int instruction_type = VM_Version::has_lqarx() ? size : 4; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1541 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1542 |
Register shift_amount = noreg, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1543 |
val32 = dest_current_value, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1544 |
modval = exchange_value; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1545 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1546 |
if (instruction_type != size) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1547 |
assert_different_registers(tmp1, tmp2, dest_current_value, compare_value, exchange_value, addr_base); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1548 |
shift_amount = tmp1; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1549 |
val32 = tmp2; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1550 |
modval = tmp2; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1551 |
// Need some preperation: Compute shift amount, align address. Note: shorts must be 2 byte aligned. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1552 |
#ifdef VM_LITTLE_ENDIAN |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1553 |
rldic(shift_amount, addr_base, 3, 64-5); // (dest & 3) * 8; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1554 |
clrrdi(addr_base, addr_base, 2); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1555 |
#else |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1556 |
xori(shift_amount, addr_base, (size == 1) ? 3 : 2); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1557 |
clrrdi(addr_base, addr_base, 2); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1558 |
rldic(shift_amount, shift_amount, 3, 64-5); // byte: ((3-dest) & 3) * 8; short: ((1-dest/2) & 1) * 16; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1559 |
#endif |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1560 |
// Transform exchange value such that the replacement can be done by one xor instruction. |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1561 |
xorr(exchange_value, compare_value, exchange_value); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1562 |
clrldi(exchange_value, exchange_value, (size == 1) ? 56 : 48); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1563 |
slw(exchange_value, exchange_value, shift_amount); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1564 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1565 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1566 |
// atomic emulation loop |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1567 |
bind(retry); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1568 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1569 |
switch (instruction_type) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1570 |
case 4: lwarx(val32, addr_base, cmpxchgx_hint); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1571 |
case 2: lharx(val32, addr_base, cmpxchgx_hint); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1572 |
case 1: lbarx(val32, addr_base, cmpxchgx_hint); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1573 |
default: ShouldNotReachHere(); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1574 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1575 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1576 |
if (instruction_type != size) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1577 |
srw(dest_current_value, val32, shift_amount); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1578 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1579 |
if (size == 1) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1580 |
extsb(dest_current_value, dest_current_value); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1581 |
} else if (size == 2) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1582 |
extsh(dest_current_value, dest_current_value); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1583 |
}; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1584 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1585 |
cmpw(flag, dest_current_value, compare_value); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1586 |
if (UseStaticBranchPredictionInCompareAndSwapPPC64) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1587 |
bne_predict_not_taken(flag, failed); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1588 |
} else { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1589 |
bne( flag, failed); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1590 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1591 |
// branch to failed => (flag == ne), (dest_current_value != compare_value) |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1592 |
// fall through => (flag == eq), (dest_current_value == compare_value) |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1593 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1594 |
if (instruction_type != size) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1595 |
xorr(modval, val32, exchange_value); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1596 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1597 |
|
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1598 |
switch (instruction_type) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1599 |
case 4: stwcx_(modval, addr_base); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1600 |
case 2: sthcx_(modval, addr_base); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1601 |
case 1: stbcx_(modval, addr_base); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1602 |
default: ShouldNotReachHere(); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1603 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1604 |
} |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1605 |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1606 |
// CmpxchgX sets condition register to cmpX(current, compare). |
39444
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1607 |
void MacroAssembler::cmpxchg_generic(ConditionRegister flag, Register dest_current_value, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1608 |
Register compare_value, Register exchange_value, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1609 |
Register addr_base, Register tmp1, Register tmp2, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1610 |
int semantics, bool cmpxchgx_hint, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1611 |
Register int_flag_success, bool contention_hint, bool weak, int size) { |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1612 |
Label retry; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1613 |
Label failed; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1614 |
Label done; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1615 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1616 |
// Save one branch if result is returned via register and |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1617 |
// result register is different from the other ones. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1618 |
bool use_result_reg = (int_flag_success != noreg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1619 |
bool preset_result_reg = (int_flag_success != dest_current_value && int_flag_success != compare_value && |
39444
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1620 |
int_flag_success != exchange_value && int_flag_success != addr_base && |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1621 |
int_flag_success != tmp1 && int_flag_success != tmp2); |
38685
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1622 |
assert(!weak || flag == CCR0, "weak only supported with CCR0"); |
39444
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1623 |
assert(size == 1 || size == 2 || size == 4, "unsupported"); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1624 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1625 |
if (use_result_reg && preset_result_reg) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1626 |
li(int_flag_success, 0); // preset (assume cas failed) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1627 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1628 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1629 |
// Add simple guard in order to reduce risk of starving under high contention (recommended by IBM). |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1630 |
if (contention_hint) { // Don't try to reserve if cmp fails. |
39444
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1631 |
switch (size) { |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1632 |
case 1: lbz(dest_current_value, 0, addr_base); extsb(dest_current_value, dest_current_value); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1633 |
case 2: lha(dest_current_value, 0, addr_base); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1634 |
case 4: lwz(dest_current_value, 0, addr_base); break; |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1635 |
default: ShouldNotReachHere(); |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1636 |
} |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1637 |
cmpw(flag, dest_current_value, compare_value); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1638 |
bne(flag, failed); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1639 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1640 |
|
35085 | 1641 |
// release/fence semantics |
1642 |
if (semantics & MemBarRel) { |
|
1643 |
release(); |
|
1644 |
} |
|
1645 |
||
39444
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1646 |
cmpxchg_loop_body(flag, dest_current_value, compare_value, exchange_value, addr_base, tmp1, tmp2, |
2eae9b74c1f3
8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents:
38931
diff
changeset
|
1647 |
retry, failed, cmpxchgx_hint, size); |
38685
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1648 |
if (!weak || use_result_reg) { |
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1649 |
if (UseStaticBranchPredictionInCompareAndSwapPPC64) { |
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1650 |
bne_predict_not_taken(CCR0, weak ? failed : retry); // StXcx_ sets CCR0. |
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1651 |
} else { |
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1652 |
bne( CCR0, weak ? failed : retry); // StXcx_ sets CCR0. |
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1653 |
} |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1654 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1655 |
// fall through => (flag == eq), (dest_current_value == compare_value), (swapped) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1656 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1657 |
// Result in register (must do this at the end because int_flag_success can be the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1658 |
// same register as one above). |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1659 |
if (use_result_reg) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1660 |
li(int_flag_success, 1); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1661 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1662 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1663 |
if (semantics & MemBarFenceAfter) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1664 |
fence(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1665 |
} else if (semantics & MemBarAcq) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1666 |
isync(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1667 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1668 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1669 |
if (use_result_reg && !preset_result_reg) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1670 |
b(done); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1671 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1672 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1673 |
bind(failed); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1674 |
if (use_result_reg && !preset_result_reg) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1675 |
li(int_flag_success, 0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1676 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1677 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1678 |
bind(done); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1679 |
// (flag == ne) => (dest_current_value != compare_value), (!swapped) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1680 |
// (flag == eq) => (dest_current_value == compare_value), ( swapped) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1681 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1682 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1683 |
// Performs atomic compare exchange: |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1684 |
// if (compare_value == *addr_base) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1685 |
// *addr_base = exchange_value |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1686 |
// int_flag_success = 1; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1687 |
// else |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1688 |
// int_flag_success = 0; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1689 |
// |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1690 |
// ConditionRegister flag = cmp(compare_value, *addr_base) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1691 |
// Register dest_current_value = *addr_base |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1692 |
// Register compare_value Used to compare with value in memory |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1693 |
// Register exchange_value Written to memory if compare_value == *addr_base |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1694 |
// Register addr_base The memory location to compare and exchange |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1695 |
// Register int_flag_success Set to 1 if exchange_value was written to *addr_base |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1696 |
// |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1697 |
// To avoid the costly compare exchange, the value is tested beforehand when contention_hint is set. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1698 |
// Several special cases exist to avoid generating unnecessary instructions. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1699 |
// |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1700 |
void MacroAssembler::cmpxchgd(ConditionRegister flag, |
30303 | 1701 |
Register dest_current_value, RegisterOrConstant compare_value, Register exchange_value, |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1702 |
Register addr_base, int semantics, bool cmpxchgx_hint, |
38685
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1703 |
Register int_flag_success, Label* failed_ext, bool contention_hint, bool weak) { |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1704 |
Label retry; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1705 |
Label failed_int; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1706 |
Label& failed = (failed_ext != NULL) ? *failed_ext : failed_int; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1707 |
Label done; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1708 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1709 |
// Save one branch if result is returned via register and result register is different from the other ones. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1710 |
bool use_result_reg = (int_flag_success!=noreg); |
30303 | 1711 |
bool preset_result_reg = (int_flag_success!=dest_current_value && int_flag_success!=compare_value.register_or_noreg() && |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1712 |
int_flag_success!=exchange_value && int_flag_success!=addr_base); |
38685
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1713 |
assert(!weak || flag == CCR0, "weak only supported with CCR0"); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1714 |
assert(int_flag_success == noreg || failed_ext == NULL, "cannot have both"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1715 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1716 |
if (use_result_reg && preset_result_reg) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1717 |
li(int_flag_success, 0); // preset (assume cas failed) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1718 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1719 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1720 |
// Add simple guard in order to reduce risk of starving under high contention (recommended by IBM). |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1721 |
if (contention_hint) { // Don't try to reserve if cmp fails. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1722 |
ld(dest_current_value, 0, addr_base); |
30303 | 1723 |
cmpd(flag, compare_value, dest_current_value); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1724 |
bne(flag, failed); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1725 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1726 |
|
35085 | 1727 |
// release/fence semantics |
1728 |
if (semantics & MemBarRel) { |
|
1729 |
release(); |
|
1730 |
} |
|
1731 |
||
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1732 |
// atomic emulation loop |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1733 |
bind(retry); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1734 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1735 |
ldarx(dest_current_value, addr_base, cmpxchgx_hint); |
30303 | 1736 |
cmpd(flag, compare_value, dest_current_value); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1737 |
if (UseStaticBranchPredictionInCompareAndSwapPPC64) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1738 |
bne_predict_not_taken(flag, failed); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1739 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1740 |
bne( flag, failed); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1741 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1742 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1743 |
stdcx_(exchange_value, addr_base); |
38685
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1744 |
if (!weak || use_result_reg || failed_ext) { |
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1745 |
if (UseStaticBranchPredictionInCompareAndSwapPPC64) { |
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1746 |
bne_predict_not_taken(CCR0, weak ? failed : retry); // stXcx_ sets CCR0 |
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1747 |
} else { |
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1748 |
bne( CCR0, weak ? failed : retry); // stXcx_ sets CCR0 |
e34308190947
8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents:
38074
diff
changeset
|
1749 |
} |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1750 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1751 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1752 |
// result in register (must do this at the end because int_flag_success can be the same register as one above) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1753 |
if (use_result_reg) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1754 |
li(int_flag_success, 1); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1755 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1756 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1757 |
if (semantics & MemBarFenceAfter) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1758 |
fence(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1759 |
} else if (semantics & MemBarAcq) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1760 |
isync(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1761 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1762 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1763 |
if (use_result_reg && !preset_result_reg) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1764 |
b(done); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1765 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1766 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1767 |
bind(failed_int); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1768 |
if (use_result_reg && !preset_result_reg) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1769 |
li(int_flag_success, 0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1770 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1771 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1772 |
bind(done); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1773 |
// (flag == ne) => (dest_current_value != compare_value), (!swapped) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1774 |
// (flag == eq) => (dest_current_value == compare_value), ( swapped) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1775 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1776 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1777 |
// Look up the method for a megamorphic invokeinterface call. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1778 |
// The target method is determined by <intf_klass, itable_index>. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1779 |
// The receiver klass is in recv_klass. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1780 |
// On success, the result will be in method_result, and execution falls through. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1781 |
// On failure, execution transfers to the given label. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1782 |
void MacroAssembler::lookup_interface_method(Register recv_klass, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1783 |
Register intf_klass, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1784 |
RegisterOrConstant itable_index, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1785 |
Register method_result, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1786 |
Register scan_temp, |
48585
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1787 |
Register temp2, |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1788 |
Label& L_no_such_interface, |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1789 |
bool return_method) { |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1790 |
assert_different_registers(recv_klass, intf_klass, method_result, scan_temp); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1791 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1792 |
// Compute start of first itableOffsetEntry (which is at the end of the vtable). |
35899 | 1793 |
int vtable_base = in_bytes(Klass::vtable_start_offset()); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1794 |
int itentry_off = itableMethodEntry::method_offset_in_bytes(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1795 |
int logMEsize = exact_log2(itableMethodEntry::size() * wordSize); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1796 |
int scan_step = itableOffsetEntry::size() * wordSize; |
35871
607bf949dfb3
8147461: Use byte offsets for vtable start and vtable length offsets
mgerdin
parents:
35232
diff
changeset
|
1797 |
int log_vte_size= exact_log2(vtableEntry::size_in_bytes()); |
607bf949dfb3
8147461: Use byte offsets for vtable start and vtable length offsets
mgerdin
parents:
35232
diff
changeset
|
1798 |
|
35899 | 1799 |
lwz(scan_temp, in_bytes(Klass::vtable_length_offset()), recv_klass); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1800 |
// %%% We should store the aligned, prescaled offset in the klassoop. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1801 |
// Then the next several instructions would fold away. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1802 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1803 |
sldi(scan_temp, scan_temp, log_vte_size); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1804 |
addi(scan_temp, scan_temp, vtable_base); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1805 |
add(scan_temp, recv_klass, scan_temp); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1806 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1807 |
// Adjust recv_klass by scaled itable_index, so we can free itable_index. |
48585
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1808 |
if (return_method) { |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1809 |
if (itable_index.is_register()) { |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1810 |
Register itable_offset = itable_index.as_register(); |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1811 |
sldi(method_result, itable_offset, logMEsize); |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1812 |
if (itentry_off) { addi(method_result, method_result, itentry_off); } |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1813 |
add(method_result, method_result, recv_klass); |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1814 |
} else { |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1815 |
long itable_offset = (long)itable_index.as_constant(); |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1816 |
// static address, no relocation |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1817 |
add_const_optimized(method_result, recv_klass, (itable_offset << logMEsize) + itentry_off, temp2); |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1818 |
} |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1819 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1820 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1821 |
// for (scan = klass->itable(); scan->interface() != NULL; scan += scan_step) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1822 |
// if (scan->interface() == intf) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1823 |
// result = (klass + scan->offset() + itable_index); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1824 |
// } |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1825 |
// } |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1826 |
Label search, found_method; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1827 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1828 |
for (int peel = 1; peel >= 0; peel--) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1829 |
// %%%% Could load both offset and interface in one ldx, if they were |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1830 |
// in the opposite order. This would save a load. |
48585
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1831 |
ld(temp2, itableOffsetEntry::interface_offset_in_bytes(), scan_temp); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1832 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1833 |
// Check that this entry is non-null. A null entry means that |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1834 |
// the receiver class doesn't implement the interface, and wasn't the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1835 |
// same as when the caller was compiled. |
48585
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1836 |
cmpd(CCR0, temp2, intf_klass); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1837 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1838 |
if (peel) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1839 |
beq(CCR0, found_method); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1840 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1841 |
bne(CCR0, search); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1842 |
// (invert the test to fall through to found_method...) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1843 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1844 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1845 |
if (!peel) break; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1846 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1847 |
bind(search); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1848 |
|
48585
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1849 |
cmpdi(CCR0, temp2, 0); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1850 |
beq(CCR0, L_no_such_interface); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1851 |
addi(scan_temp, scan_temp, scan_step); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1852 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1853 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1854 |
bind(found_method); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1855 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1856 |
// Got a hit. |
48585
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1857 |
if (return_method) { |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1858 |
int ito_offset = itableOffsetEntry::offset_offset_in_bytes(); |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1859 |
lwz(scan_temp, ito_offset, scan_temp); |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1860 |
ldx(method_result, scan_temp, method_result); |
d9fcb7ba8133
8191907: PPC64 and s390 parts of JDK-8174962: Better interface invocations
mdoerr
parents:
48332
diff
changeset
|
1861 |
} |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1862 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1863 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1864 |
// virtual method calling |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1865 |
void MacroAssembler::lookup_virtual_method(Register recv_klass, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1866 |
RegisterOrConstant vtable_index, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1867 |
Register method_result) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1868 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1869 |
assert_different_registers(recv_klass, method_result, vtable_index.register_or_noreg()); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1870 |
|
35899 | 1871 |
const int base = in_bytes(Klass::vtable_start_offset()); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1872 |
assert(vtableEntry::size() * wordSize == wordSize, "adjust the scaling in the code below"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1873 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1874 |
if (vtable_index.is_register()) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1875 |
sldi(vtable_index.as_register(), vtable_index.as_register(), LogBytesPerWord); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1876 |
add(recv_klass, vtable_index.as_register(), recv_klass); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1877 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1878 |
addi(recv_klass, recv_klass, vtable_index.as_constant() << LogBytesPerWord); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1879 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1880 |
ld(R19_method, base + vtableEntry::method_offset_in_bytes(), recv_klass); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1881 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1882 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1883 |
/////////////////////////////////////////// subtype checking //////////////////////////////////////////// |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1884 |
// Emit the fast part of a subtype check: is 'sub_klass' a subtype of 'super_klass'?
//
//   sub_klass, super_klass - klasses to compare (not modified by this code).
//   temp1_reg              - receives the super check offset when it has to be
//                            loaded from super_klass.
//   temp2_reg              - receives the word loaded from
//                            sub_klass + super_check_offset.
//   L_success / L_failure / L_slow_path
//                          - branch targets for the three possible outcomes.
//                            A NULL label means "fall through" for that outcome;
//                            normally at most one of them may be NULL (see the
//                            assert below).
//   super_check_offset     - the super check offset of super_klass as a register
//                            or a constant; the constant -1 means "unknown, load
//                            it from super_klass".
//
// CCR0 is used for all comparisons.
void MacroAssembler::check_klass_subtype_fast_path(Register sub_klass,
                                                   Register super_klass,
                                                   Register temp1_reg,
                                                   Register temp2_reg,
                                                   Label* L_success,
                                                   Label* L_failure,
                                                   Label* L_slow_path,
                                                   RegisterOrConstant super_check_offset) {

  const Register check_cache_offset = temp1_reg;
  const Register cached_super       = temp2_reg;

  assert_different_registers(sub_klass, super_klass, check_cache_offset, cached_super);

  int sco_offset = in_bytes(Klass::super_check_offset_offset());
  int sc_offset  = in_bytes(Klass::secondary_super_cache_offset());

  bool must_load_sco  = (super_check_offset.constant_or_zero() == -1);
  // A slow path can only be needed if the check offset is unknown at code
  // generation time or if it designates the secondary super cache. This has to
  // be compared against sc_offset (the same condition the code below uses),
  // not against sco_offset, which is merely where the offset is stored.
  bool need_slow_path = (must_load_sco || super_check_offset.constant_or_zero() == sc_offset);

  Label L_fallthrough;
  int label_nulls = 0;
  if (L_success == NULL)   { L_success   = &L_fallthrough; label_nulls++; }
  if (L_failure == NULL)   { L_failure   = &L_fallthrough; label_nulls++; }
  if (L_slow_path == NULL) { L_slow_path = &L_fallthrough; label_nulls++; }
  assert(label_nulls <= 1 ||
         (L_slow_path == &L_fallthrough && label_nulls <= 2 && !need_slow_path),
         "at most one NULL in the batch, usually");

  // If the pointers are equal, we are done (e.g., String[] elements).
  // This self-check enables sharing of secondary supertype arrays among
  // non-primary types such as array-of-interface. Otherwise, each such
  // type would need its own customized SSA.
  // We move this check to the front of the fast path because many
  // type checks are in fact trivially successful in this manner,
  // so we get a nicely predicted branch right at the start of the check.
  cmpd(CCR0, sub_klass, super_klass);
  beq(CCR0, *L_success);

  // Check the supertype display:
  if (must_load_sco) {
    // The super check offset is always positive...
    lwz(check_cache_offset, sco_offset, super_klass);
    super_check_offset = RegisterOrConstant(check_cache_offset);
    // super_check_offset is register.
    assert_different_registers(sub_klass, super_klass, cached_super, super_check_offset.as_register());
  }
  // The loaded value is the offset from KlassOopDesc.

  ld(cached_super, super_check_offset, sub_klass);
  cmpd(CCR0, cached_super, super_klass);

  // This check has worked decisively for primary supers.
  // Secondary supers are sought in the super_cache ('super_cache_addr').
  // (Secondary supers are interfaces and very deeply nested subtypes.)
  // This works in the same check above because of a tricky aliasing
  // between the super_cache and the primary super display elements.
  // (The 'super_check_addr' can address either, as the case requires.)
  // Note that the cache is updated below if it does not help us find
  // what we need immediately.
  // So if it was a primary super, we can just fail immediately.
  // Otherwise, it's the slow path for us (no success at this point).

  // Emit an unconditional branch unless the target is simply the fall-through point.
#define FINAL_JUMP(label) if (&(label) != &L_fallthrough) { b(label); }

  if (super_check_offset.is_register()) {
    // Offset only known at run time: a match is a success; otherwise the
    // offset decides between slow path (it designates the secondary super
    // cache) and failure.
    beq(CCR0, *L_success);
    cmpwi(CCR0, super_check_offset.as_register(), sc_offset);
    if (L_failure == &L_fallthrough) {
      beq(CCR0, *L_slow_path);
    } else {
      bne(CCR0, *L_failure);
      FINAL_JUMP(*L_slow_path);
    }
  } else {
    if (super_check_offset.as_constant() == sc_offset) {
      // Need a slow path; fast failure is impossible.
      if (L_slow_path == &L_fallthrough) {
        beq(CCR0, *L_success);
      } else {
        bne(CCR0, *L_slow_path);
        FINAL_JUMP(*L_success);
      }
    } else {
      // No slow path; it's a fast decision.
      if (L_failure == &L_fallthrough) {
        beq(CCR0, *L_success);
      } else {
        bne(CCR0, *L_failure);
        FINAL_JUMP(*L_success);
      }
    }
  }

  bind(L_fallthrough);
#undef FINAL_JUMP
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1981 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1982 |
void MacroAssembler::check_klass_subtype_slow_path(Register sub_klass, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1983 |
Register super_klass, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1984 |
Register temp1_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1985 |
Register temp2_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1986 |
Label* L_success, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1987 |
Register result_reg) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1988 |
const Register array_ptr = temp1_reg; // current value from cache array |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1989 |
const Register temp = temp2_reg; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1990 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1991 |
assert_different_registers(sub_klass, super_klass, array_ptr, temp); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1992 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1993 |
int source_offset = in_bytes(Klass::secondary_supers_offset()); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1994 |
int target_offset = in_bytes(Klass::secondary_super_cache_offset()); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1995 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1996 |
int length_offset = Array<Klass*>::length_offset_in_bytes(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1997 |
int base_offset = Array<Klass*>::base_offset_in_bytes(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1998 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
1999 |
Label hit, loop, failure, fallthru; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2000 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2001 |
ld(array_ptr, source_offset, sub_klass); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2002 |
|
35085 | 2003 |
// TODO: PPC port: assert(4 == arrayOopDesc::length_length_in_bytes(), "precondition violated."); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2004 |
lwz(temp, length_offset, array_ptr); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2005 |
cmpwi(CCR0, temp, 0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2006 |
beq(CCR0, result_reg!=noreg ? failure : fallthru); // length 0 |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2007 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2008 |
mtctr(temp); // load ctr |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2009 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2010 |
bind(loop); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2011 |
// Oops in table are NO MORE compressed. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2012 |
ld(temp, base_offset, array_ptr); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2013 |
cmpd(CCR0, temp, super_klass); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2014 |
beq(CCR0, hit); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2015 |
addi(array_ptr, array_ptr, BytesPerWord); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2016 |
bdnz(loop); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2017 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2018 |
bind(failure); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2019 |
if (result_reg!=noreg) li(result_reg, 1); // load non-zero result (indicates a miss) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2020 |
b(fallthru); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2021 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2022 |
bind(hit); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2023 |
std(super_klass, target_offset, sub_klass); // save result to cache |
35085 | 2024 |
if (result_reg != noreg) { li(result_reg, 0); } // load zero result (indicates a hit) |
2025 |
if (L_success != NULL) { b(*L_success); } |
|
2026 |
else if (result_reg == noreg) { blr(); } // return with CR0.eq if neither label nor result reg provided |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2027 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2028 |
bind(fallthru); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2029 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2030 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2031 |
// Try fast path, then go to slow one if not successful |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2032 |
void MacroAssembler::check_klass_subtype(Register sub_klass, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2033 |
Register super_klass, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2034 |
Register temp1_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2035 |
Register temp2_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2036 |
Label& L_success) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2037 |
Label L_failure; |
35085 | 2038 |
check_klass_subtype_fast_path(sub_klass, super_klass, temp1_reg, temp2_reg, &L_success, &L_failure); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2039 |
check_klass_subtype_slow_path(sub_klass, super_klass, temp1_reg, temp2_reg, &L_success); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2040 |
bind(L_failure); // Fallthru if not successful. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2041 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2042 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2043 |
void MacroAssembler::check_method_handle_type(Register mtype_reg, Register mh_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2044 |
Register temp_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2045 |
Label& wrong_method_type) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2046 |
assert_different_registers(mtype_reg, mh_reg, temp_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2047 |
// Compare method type against that of the receiver. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2048 |
load_heap_oop_not_null(temp_reg, delayed_value(java_lang_invoke_MethodHandle::type_offset_in_bytes, temp_reg), mh_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2049 |
cmpd(CCR0, temp_reg, mtype_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2050 |
bne(CCR0, wrong_method_type); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2051 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2052 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2053 |
// Returns the byte offset of an interpreter argument slot.
//
//   arg_slot          - slot index, either a compile-time constant or a register.
//   temp_reg          - receives the computed offset when arg_slot is a register;
//                       must not be noreg in that case.
//   extra_slot_offset - additional number of slots added to arg_slot.
//
// For a constant arg_slot the result is a constant and no code is emitted.
// For a register arg_slot code is emitted that leaves the offset in temp_reg,
// and temp_reg is returned.
RegisterOrConstant MacroAssembler::argument_offset(RegisterOrConstant arg_slot,
                                                   Register temp_reg,
                                                   int extra_slot_offset) {
  // cf. TemplateTable::prepare_invoke(), if (load_receiver).
  const int slot_size = Interpreter::stackElementSize;
  int byte_offset = extra_slot_offset * slot_size;

  if (!arg_slot.is_constant()) {
    // Slot index is only known at run time: scale it by the slot size with a
    // shift and add the constant part if there is one.
    assert(temp_reg != noreg, "must specify");
    sldi(temp_reg, arg_slot.as_register(), exact_log2(slot_size));
    if (byte_offset != 0) {
      addi(temp_reg, temp_reg, byte_offset);
    }
    return temp_reg;
  }

  // Everything is known at code generation time: fold it into one constant.
  byte_offset += arg_slot.as_constant() * slot_size;
  return byte_offset;
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2070 |
|
35085 | 2071 |
// Supports temp2_reg = R0. |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2072 |
void MacroAssembler::biased_locking_enter(ConditionRegister cr_reg, Register obj_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2073 |
Register mark_reg, Register temp_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2074 |
Register temp2_reg, Label& done, Label* slow_case) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2075 |
assert(UseBiasedLocking, "why call this otherwise?"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2076 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2077 |
#ifdef ASSERT |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2078 |
assert_different_registers(obj_reg, mark_reg, temp_reg, temp2_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2079 |
#endif |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2080 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2081 |
Label cas_label; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2082 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2083 |
// Branch to done if fast path fails and no slow_case provided. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2084 |
Label *slow_case_int = (slow_case != NULL) ? slow_case : &done; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2085 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2086 |
// Biased locking |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2087 |
// See whether the lock is currently biased toward our thread and |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2088 |
// whether the epoch is still valid |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2089 |
// Note that the runtime guarantees sufficient alignment of JavaThread |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2090 |
// pointers to allow age to be placed into low bits |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2091 |
assert(markOopDesc::age_shift == markOopDesc::lock_bits + markOopDesc::biased_lock_bits, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2092 |
"biased locking makes assumptions about bit layout"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2093 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2094 |
if (PrintBiasedLockingStatistics) { |
35085 | 2095 |
load_const(temp2_reg, (address) BiasedLocking::total_entry_count_addr(), temp_reg); |
2096 |
lwzx(temp_reg, temp2_reg); |
|
2097 |
addi(temp_reg, temp_reg, 1); |
|
2098 |
stwx(temp_reg, temp2_reg); |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2099 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2100 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2101 |
andi(temp_reg, mark_reg, markOopDesc::biased_lock_mask_in_place); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2102 |
cmpwi(cr_reg, temp_reg, markOopDesc::biased_lock_pattern); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2103 |
bne(cr_reg, cas_label); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2104 |
|
23492 | 2105 |
load_klass(temp_reg, obj_reg); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2106 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2107 |
load_const_optimized(temp2_reg, ~((int) markOopDesc::age_mask_in_place)); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2108 |
ld(temp_reg, in_bytes(Klass::prototype_header_offset()), temp_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2109 |
orr(temp_reg, R16_thread, temp_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2110 |
xorr(temp_reg, mark_reg, temp_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2111 |
andr(temp_reg, temp_reg, temp2_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2112 |
cmpdi(cr_reg, temp_reg, 0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2113 |
if (PrintBiasedLockingStatistics) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2114 |
Label l; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2115 |
bne(cr_reg, l); |
35085 | 2116 |
load_const(temp2_reg, (address) BiasedLocking::biased_lock_entry_count_addr()); |
2117 |
lwzx(mark_reg, temp2_reg); |
|
2118 |
addi(mark_reg, mark_reg, 1); |
|
2119 |
stwx(mark_reg, temp2_reg); |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2120 |
// restore mark_reg |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2121 |
ld(mark_reg, oopDesc::mark_offset_in_bytes(), obj_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2122 |
bind(l); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2123 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2124 |
beq(cr_reg, done); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2125 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2126 |
Label try_revoke_bias; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2127 |
Label try_rebias; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2128 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2129 |
// At this point we know that the header has the bias pattern and |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2130 |
// that we are not the bias owner in the current epoch. We need to |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2131 |
// figure out more details about the state of the header in order to |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2132 |
// know what operations can be legally performed on the object's |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2133 |
// header. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2134 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2135 |
// If the low three bits in the xor result aren't clear, that means |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2136 |
// the prototype header is no longer biased and we have to revoke |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2137 |
// the bias on this object. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2138 |
andi(temp2_reg, temp_reg, markOopDesc::biased_lock_mask_in_place); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2139 |
cmpwi(cr_reg, temp2_reg, 0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2140 |
bne(cr_reg, try_revoke_bias); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2141 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2142 |
// Biasing is still enabled for this data type. See whether the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2143 |
// epoch of the current bias is still valid, meaning that the epoch |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2144 |
// bits of the mark word are equal to the epoch bits of the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2145 |
// prototype header. (Note that the prototype header's epoch bits |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2146 |
// only change at a safepoint.) If not, attempt to rebias the object |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2147 |
// toward the current thread. Note that we must be absolutely sure |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2148 |
// that the current epoch is invalid in order to do this because |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2149 |
// otherwise the manipulations it performs on the mark word are |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2150 |
// illegal. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2151 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2152 |
int shift_amount = 64 - markOopDesc::epoch_shift; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2153 |
// rotate epoch bits to right (little) end and set other bits to 0 |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2154 |
// [ big part | epoch | little part ] -> [ 0..0 | epoch ] |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2155 |
rldicl_(temp2_reg, temp_reg, shift_amount, 64 - markOopDesc::epoch_bits); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2156 |
// branch if epoch bits are != 0, i.e. they differ, because the epoch has been incremented |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2157 |
bne(CCR0, try_rebias); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2158 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2159 |
// The epoch of the current bias is still valid but we know nothing |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2160 |
// about the owner; it might be set or it might be clear. Try to |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2161 |
// acquire the bias of the object using an atomic operation. If this |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2162 |
// fails we will go in to the runtime to revoke the object's bias. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2163 |
// Note that we first construct the presumed unbiased header so we |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2164 |
// don't accidentally blow away another thread's valid bias. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2165 |
andi(mark_reg, mark_reg, (markOopDesc::biased_lock_mask_in_place | |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2166 |
markOopDesc::age_mask_in_place | |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2167 |
markOopDesc::epoch_mask_in_place)); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2168 |
orr(temp_reg, R16_thread, mark_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2169 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2170 |
assert(oopDesc::mark_offset_in_bytes() == 0, "offset of _mark is not 0"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2171 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2172 |
// CmpxchgX sets cr_reg to cmpX(temp2_reg, mark_reg). |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2173 |
cmpxchgd(/*flag=*/cr_reg, /*current_value=*/temp2_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2174 |
/*compare_value=*/mark_reg, /*exchange_value=*/temp_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2175 |
/*where=*/obj_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2176 |
MacroAssembler::MemBarAcq, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2177 |
MacroAssembler::cmpxchgx_hint_acquire_lock(), |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2178 |
noreg, slow_case_int); // bail out if failed |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2179 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2180 |
// If the biasing toward our thread failed, this means that |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2181 |
// another thread succeeded in biasing it toward itself and we |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2182 |
// need to revoke that bias. The revocation will occur in the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2183 |
// interpreter runtime in the slow case. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2184 |
if (PrintBiasedLockingStatistics) { |
35085 | 2185 |
load_const(temp2_reg, (address) BiasedLocking::anonymously_biased_lock_entry_count_addr(), temp_reg); |
2186 |
lwzx(temp_reg, temp2_reg); |
|
2187 |
addi(temp_reg, temp_reg, 1); |
|
2188 |
stwx(temp_reg, temp2_reg); |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2189 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2190 |
b(done); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2191 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2192 |
bind(try_rebias); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2193 |
// At this point we know the epoch has expired, meaning that the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2194 |
// current "bias owner", if any, is actually invalid. Under these |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2195 |
// circumstances _only_, we are allowed to use the current header's |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2196 |
// value as the comparison value when doing the cas to acquire the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2197 |
// bias in the current epoch. In other words, we allow transfer of |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2198 |
// the bias from one thread to another directly in this situation. |
35085 | 2199 |
load_klass(temp_reg, obj_reg); |
2200 |
andi(temp2_reg, mark_reg, markOopDesc::age_mask_in_place); |
|
2201 |
orr(temp2_reg, R16_thread, temp2_reg); |
|
2202 |
ld(temp_reg, in_bytes(Klass::prototype_header_offset()), temp_reg); |
|
2203 |
orr(temp_reg, temp2_reg, temp_reg); |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2204 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2205 |
assert(oopDesc::mark_offset_in_bytes() == 0, "offset of _mark is not 0"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2206 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2207 |
cmpxchgd(/*flag=*/cr_reg, /*current_value=*/temp2_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2208 |
/*compare_value=*/mark_reg, /*exchange_value=*/temp_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2209 |
/*where=*/obj_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2210 |
MacroAssembler::MemBarAcq, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2211 |
MacroAssembler::cmpxchgx_hint_acquire_lock(), |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2212 |
noreg, slow_case_int); // bail out if failed |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2213 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2214 |
// If the biasing toward our thread failed, this means that |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2215 |
// another thread succeeded in biasing it toward itself and we |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2216 |
// need to revoke that bias. The revocation will occur in the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2217 |
// interpreter runtime in the slow case. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2218 |
if (PrintBiasedLockingStatistics) { |
35085 | 2219 |
load_const(temp2_reg, (address) BiasedLocking::rebiased_lock_entry_count_addr(), temp_reg); |
2220 |
lwzx(temp_reg, temp2_reg); |
|
2221 |
addi(temp_reg, temp_reg, 1); |
|
2222 |
stwx(temp_reg, temp2_reg); |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2223 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2224 |
b(done); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2225 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2226 |
bind(try_revoke_bias); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2227 |
// The prototype mark in the klass doesn't have the bias bit set any |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2228 |
// more, indicating that objects of this data type are not supposed |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2229 |
// to be biased any more. We are going to try to reset the mark of |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2230 |
// this object to the prototype value and fall through to the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2231 |
// CAS-based locking scheme. Note that if our CAS fails, it means |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2232 |
// that another thread raced us for the privilege of revoking the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2233 |
// bias of this particular object, so it's okay to continue in the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2234 |
// normal locking code. |
23492 | 2235 |
load_klass(temp_reg, obj_reg); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2236 |
ld(temp_reg, in_bytes(Klass::prototype_header_offset()), temp_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2237 |
andi(temp2_reg, mark_reg, markOopDesc::age_mask_in_place); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2238 |
orr(temp_reg, temp_reg, temp2_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2239 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2240 |
assert(oopDesc::mark_offset_in_bytes() == 0, "offset of _mark is not 0"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2241 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2242 |
// CmpxchgX sets cr_reg to cmpX(temp2_reg, mark_reg). |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2243 |
cmpxchgd(/*flag=*/cr_reg, /*current_value=*/temp2_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2244 |
/*compare_value=*/mark_reg, /*exchange_value=*/temp_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2245 |
/*where=*/obj_reg, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2246 |
MacroAssembler::MemBarAcq, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2247 |
MacroAssembler::cmpxchgx_hint_acquire_lock()); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2248 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2249 |
// reload markOop in mark_reg before continuing with lightweight locking |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2250 |
ld(mark_reg, oopDesc::mark_offset_in_bytes(), obj_reg); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2251 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2252 |
// Fall through to the normal CAS-based lock, because no matter what |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2253 |
// the result of the above CAS, some thread must have succeeded in |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2254 |
// removing the bias bit from the object's header. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2255 |
if (PrintBiasedLockingStatistics) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2256 |
Label l; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2257 |
bne(cr_reg, l); |
35085 | 2258 |
load_const(temp2_reg, (address) BiasedLocking::revoked_lock_entry_count_addr(), temp_reg); |
2259 |
lwzx(temp_reg, temp2_reg); |
|
2260 |
addi(temp_reg, temp_reg, 1); |
|
2261 |
stwx(temp_reg, temp2_reg); |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2262 |
bind(l); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2263 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2264 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2265 |
bind(cas_label); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2266 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2267 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2268 |
// Emits the biased-locking check for monitor exit.
//
//   cr_reg    - condition register field used for the compare and branch.
//   mark_addr - address the mark word is loaded from (offset 0).
//   temp_reg  - scratch register; receives the masked mark word.
//   done      - branched to when the mark word carries the bias pattern.
//
// Falls through when the mark word does not carry the bias pattern.
void MacroAssembler::biased_locking_exit(ConditionRegister cr_reg, Register mark_addr,
                                         Register temp_reg, Label& done) {
  // Unlocking a biased lock is a no-op, so only the bias pattern is tested.
  // The thread ID does not have to be checked, for two reasons. First, the
  // interpreter checks for IllegalMonitorStateException at a higher level.
  // Second, if the bias was revoked while we held the lock, the object
  // could not be rebiased toward another thread, so the bias bit would be
  // clear.
  ld(temp_reg, 0, mark_addr);
  andi(temp_reg, temp_reg, markOopDesc::biased_lock_mask_in_place);
  cmpwi(cr_reg, temp_reg, markOopDesc::biased_lock_pattern);
  beq(cr_reg, done);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2282 |
|
35085 | 2283 |
// allocation (for C1) |
2284 |
void MacroAssembler::eden_allocate(
  Register obj,                      // result: pointer to object after successful allocation
  Register var_size_in_bytes,        // object size in bytes if unknown at compile time; invalid otherwise
  int      con_size_in_bytes,        // object size in bytes if   known at compile time
  Register t1,                       // temp register
  Register t2,                       // temp register
  Label&   slow_case                 // continuation point if fast allocation fails
) {
  // No inline allocation sequence is emitted here; the generated code
  // branches unconditionally to the slow path.
  b(slow_case);
}
|
2294 |
||
2295 |
// Emits a bump-pointer allocation from the TLAB whose top/end are read from
// R16_thread. On success 'obj' holds the old top (start of the new object)
// and the TLAB top has been advanced; if the new top would exceed the TLAB
// end, control branches to slow_case and the TLAB is left unchanged.
// Kills R0, t1 and CCR0.
void MacroAssembler::tlab_allocate(
  Register obj,                      // result: pointer to object after successful allocation
  Register var_size_in_bytes,        // object size in bytes if unknown at compile time; invalid otherwise
  int      con_size_in_bytes,        // object size in bytes if   known at compile time
  Register t1,                       // temp register
  Label&   slow_case                 // continuation point if fast allocation fails
) {
  // make sure arguments make sense
  // R0 is used below as scratch for the TLAB end (and by the debug alignment
  // check), so none of the argument registers may alias it.
  assert_different_registers(obj, var_size_in_bytes, t1, R0);
  // The constant size is added with addi, which takes a 16 bit signed immediate.
  assert(0 <= con_size_in_bytes && is_simm(con_size_in_bytes, 16), "illegal object size");
  assert((con_size_in_bytes & MinObjAlignmentInBytesMask) == 0, "object size is not multiple of alignment");

  const Register new_top = t1;
  //verify_tlab(); not implemented

  ld(obj, in_bytes(JavaThread::tlab_top_offset()), R16_thread);
  ld(R0, in_bytes(JavaThread::tlab_end_offset()), R16_thread);
  if (var_size_in_bytes == noreg) {
    addi(new_top, obj, con_size_in_bytes);
  } else {
    add(new_top, obj, var_size_in_bytes);
  }
  // Unsigned compare: new_top > tlab end => does not fit, take the slow path.
  cmpld(CCR0, new_top, R0);
  bc_far_optimized(Assembler::bcondCRbiIs1, bi0(CCR0, Assembler::greater), slow_case);

#ifdef ASSERT
  // make sure new free pointer is properly aligned
  {
    Label L;
    andi_(R0, new_top, MinObjAlignmentInBytesMask);
    beq(CCR0, L);
    stop("updated TLAB free is not properly aligned", 0x934);
    bind(L);
  }
#endif // ASSERT

  // update the tlab top pointer
  std(new_top, in_bytes(JavaThread::tlab_top_offset()), R16_thread);
  //verify_tlab(); not implemented
}
|
2335 |
void MacroAssembler::incr_allocated_bytes(RegisterOrConstant size_in_bytes, Register t1, Register t2) {
  // No code is generated; the arguments are ignored and unimplemented() is
  // invoked with this function's name.
  unimplemented("incr_allocated_bytes");
}
|
2338 |
||
2339 |
// Emits a call trampoline stub that loads the call target from the constant
// pool slot at destination_toc_offset and branches to it via CTR.
// If Rtoc is noreg, the TOC address is computed into the scratch register
// first. Returns the stub's start address, or NULL if no stub space could be
// obtained.
address MacroAssembler::emit_trampoline_stub(int destination_toc_offset,
                                             int insts_call_instruction_offset, Register Rtoc) {
  // Start the stub.
  address stub = start_a_stub(64);
  if (stub == NULL) {
    // CodeCache full: bail out
    return NULL;
  }

  // Create a trampoline stub relocation which relates this trampoline stub
  // with the call instruction at insts_call_instruction_offset in the
  // instructions code-section.
  const address call_pc = code()->insts()->start() + insts_call_instruction_offset;
  relocate(trampoline_stub_Relocation::spec(call_pc));
  const int stub_start_offset = offset();

  // For java_to_interp stubs we use R11_scratch1 as scratch register
  // and in call trampoline stubs we use R12_scratch2. This way we
  // can distinguish them (see is_NativeCallTrampolineStub_at()).
  const Register scratch = R12_scratch2;

  // Now, create the trampoline stub's code:
  // - load the TOC (only when the caller did not pass one)
  // - load the call target from the constant pool
  // - call
  const Register toc_base = (Rtoc == noreg) ? scratch : Rtoc;
  if (Rtoc == noreg) {
    calculate_address_from_global_toc(scratch, method_toc());
  }

  ld_largeoffset_unchecked(scratch, destination_toc_offset, toc_base, false);
  mtctr(scratch);
  bctr();

  const address stub_start_addr = addr_at(stub_start_offset);

  // Assert that the encoded destination_toc_offset can be identified and that it is correct.
  assert(destination_toc_offset == NativeCallTrampolineStub_at(stub_start_addr)->destination_toc_offset(),
         "encoded offset into the constant pool must match");
  // Trampoline_stub_size should be good.
  assert((uint)(offset() - stub_start_offset) <= trampoline_stub_size, "should be good size");
  assert(is_NativeCallTrampolineStub_at(stub_start_addr), "doesn't look like a trampoline");

  // End the stub.
  end_a_stub();
  return stub;
}
|
2382 |
||
30303 | 2383 |
// TM on PPC64. |
2384 |
// Emits a ldarx / addi / stdcx_ retry loop that adds simm16 to the
// doubleword at 'addr'. 'result' receives the updated value; CCR0 is
// overwritten by stdcx_.
void MacroAssembler::atomic_inc_ptr(Register addr, Register result, int simm16) {
  Label again;

  bind(again);
  ldarx(result, addr, /*hint*/ false);
  addi(result, result, simm16);
  stdcx_(result, addr);

  // stXcx_ sets CCR0; loop until the conditional store went through.
  if (!UseStaticBranchPredictionInCompareAndSwapPPC64) {
    bne(                  CCR0, again);
  } else {
    bne_predict_not_taken(CCR0, again);
  }
}
|
2396 |
||
2397 |
// Emits a lwarx / ori / stwcx_ retry loop that ORs uimm16 into the word at
// 'addr'. 'result' receives the updated value; CCR0 is overwritten by stwcx_.
void MacroAssembler::atomic_ori_int(Register addr, Register result, int uimm16) {
  Label again;

  bind(again);
  lwarx(result, addr, /*hint*/ false);
  ori(result, result, uimm16);
  stwcx_(result, addr);

  // stXcx_ sets CCR0; loop until the conditional store went through.
  if (!UseStaticBranchPredictionInCompareAndSwapPPC64) {
    bne(                  CCR0, again);
  } else {
    bne_predict_not_taken(CCR0, again);
  }
}
|
2409 |
||
2410 |
#if INCLUDE_RTM_OPT |
|
2411 |
||
2412 |
// Update rtm_counters based on abort status |
|
2413 |
// input: abort_status |
|
2414 |
// rtm_counters (RTMLockingCounters*) |
|
2415 |
void MacroAssembler::rtm_counters_update(Register abort_status, Register rtm_counters_Reg) { |
|
2416 |
// Mapping to keep PreciseRTMLockingStatistics similar to x86. |
|
2417 |
// x86 ppc (! means inverted, ? means not the same) |
|
2418 |
// 0 31 Set if abort caused by XABORT instruction. |
|
2419 |
// 1 ! 7 If set, the transaction may succeed on a retry. This bit is always clear if bit 0 is set. |
|
2420 |
// 2 13 Set if another logical processor conflicted with a memory address that was part of the transaction that aborted. |
|
2421 |
// 3 10 Set if an internal buffer overflowed. |
|
2422 |
// 4 ?12 Set if a debug breakpoint was hit. |
|
2423 |
// 5 ?32 Set if an abort occurred during execution of a nested transaction. |
|
2424 |
const int tm_failure_bit[] = {Assembler::tm_tabort, // Note: Seems like signal handler sets this, too. |
|
2425 |
Assembler::tm_failure_persistent, // inverted: transient |
|
2426 |
Assembler::tm_trans_cf, |
|
2427 |
Assembler::tm_footprint_of, |
|
2428 |
Assembler::tm_non_trans_cf, |
|
2429 |
Assembler::tm_suspended}; |
|
2430 |
const bool tm_failure_inv[] = {false, true, false, false, false, false}; |
|
2431 |
assert(sizeof(tm_failure_bit)/sizeof(int) == RTMLockingCounters::ABORT_STATUS_LIMIT, "adapt mapping!"); |
|
2432 |
||
2433 |
const Register addr_Reg = R0; |
|
2434 |
// Keep track of offset to where rtm_counters_Reg had pointed to. |
|
2435 |
int counters_offs = RTMLockingCounters::abort_count_offset(); |
|
2436 |
addi(addr_Reg, rtm_counters_Reg, counters_offs); |
|
2437 |
const Register temp_Reg = rtm_counters_Reg; |
|
2438 |
||
2439 |
//atomic_inc_ptr(addr_Reg, temp_Reg); We don't increment atomically |
|
2440 |
ldx(temp_Reg, addr_Reg); |
|
2441 |
addi(temp_Reg, temp_Reg, 1); |
|
2442 |
stdx(temp_Reg, addr_Reg); |
|
2443 |
||
2444 |
if (PrintPreciseRTMLockingStatistics) { |
|
2445 |
int counters_offs_delta = RTMLockingCounters::abortX_count_offset() - counters_offs; |
|
2446 |
||
2447 |
//mftexasr(abort_status); done by caller |
|
2448 |
for (int i = 0; i < RTMLockingCounters::ABORT_STATUS_LIMIT; i++) { |
|
2449 |
counters_offs += counters_offs_delta; |
|
2450 |
li(temp_Reg, counters_offs_delta); // can't use addi with R0 |
|
2451 |
add(addr_Reg, addr_Reg, temp_Reg); // point to next counter |
|
2452 |
counters_offs_delta = sizeof(uintx); |
|
2453 |
||
2454 |
Label check_abort; |
|
2455 |
rldicr_(temp_Reg, abort_status, tm_failure_bit[i], 0); |
|
2456 |
if (tm_failure_inv[i]) { |
|
2457 |
bne(CCR0, check_abort); |
|
2458 |
} else { |
|
2459 |
beq(CCR0, check_abort); |
|
2460 |
} |
|
2461 |
//atomic_inc_ptr(addr_Reg, temp_Reg); We don't increment atomically |
|
2462 |
ldx(temp_Reg, addr_Reg); |
|
2463 |
addi(temp_Reg, temp_Reg, 1); |
|
2464 |
stdx(temp_Reg, addr_Reg); |
|
2465 |
bind(check_abort); |
|
2466 |
} |
|
2467 |
} |
|
2468 |
li(temp_Reg, -counters_offs); // can't use addi with R0 |
|
2469 |
add(rtm_counters_Reg, addr_Reg, temp_Reg); // restore |
|
2470 |
} |
|
2471 |
||
2472 |
// Branch if (random & (count-1) != 0), count is 2^n |
|
2473 |
// tmp and CR0 are killed |
|
2474 |
void MacroAssembler::branch_on_random_using_tb(Register tmp, int count, Label& brLabel) { |
|
2475 |
mftb(tmp); |
|
2476 |
andi_(tmp, tmp, count-1); |
|
2477 |
bne(CCR0, brLabel); |
|
2478 |
} |
|
2479 |
||
2480 |
// Perform abort ratio calculation, set no_rtm bit if high ratio. |
|
2481 |
// input: rtm_counters_Reg (RTMLockingCounters* address) - KILLED |
|
2482 |
void MacroAssembler::rtm_abort_ratio_calculation(Register rtm_counters_Reg, |
|
2483 |
RTMLockingCounters* rtm_counters, |
|
2484 |
Metadata* method_data) { |
|
2485 |
Label L_done, L_check_always_rtm1, L_check_always_rtm2; |
|
2486 |
||
2487 |
if (RTMLockingCalculationDelay > 0) { |
|
2488 |
// Delay calculation. |
|
2489 |
ld(rtm_counters_Reg, (RegisterOrConstant)(intptr_t)RTMLockingCounters::rtm_calculation_flag_addr()); |
|
2490 |
cmpdi(CCR0, rtm_counters_Reg, 0); |
|
2491 |
beq(CCR0, L_done); |
|
2492 |
load_const_optimized(rtm_counters_Reg, (address)rtm_counters, R0); // reload |
|
2493 |
} |
|
2494 |
// Abort ratio calculation only if abort_count > RTMAbortThreshold. |
|
2495 |
// Aborted transactions = abort_count * 100 |
|
2496 |
// All transactions = total_count * RTMTotalCountIncrRate |
|
2497 |
// Set no_rtm bit if (Aborted transactions >= All transactions * RTMAbortRatio) |
|
2498 |
ld(R0, RTMLockingCounters::abort_count_offset(), rtm_counters_Reg); |
|
46494
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2499 |
if (is_simm(RTMAbortThreshold, 16)) { // cmpdi can handle 16bit immediate only. |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2500 |
cmpdi(CCR0, R0, RTMAbortThreshold); |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2501 |
blt(CCR0, L_check_always_rtm2); // reload of rtm_counters_Reg not necessary |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2502 |
} else { |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2503 |
load_const_optimized(rtm_counters_Reg, RTMAbortThreshold); |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2504 |
cmpd(CCR0, R0, rtm_counters_Reg); |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2505 |
blt(CCR0, L_check_always_rtm1); // reload of rtm_counters_Reg required |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2506 |
} |
30303 | 2507 |
mulli(R0, R0, 100); |
2508 |
||
2509 |
const Register tmpReg = rtm_counters_Reg; |
|
2510 |
ld(tmpReg, RTMLockingCounters::total_count_offset(), rtm_counters_Reg); |
|
46494
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2511 |
mulli(tmpReg, tmpReg, RTMTotalCountIncrRate); // allowable range: int16 |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2512 |
mulli(tmpReg, tmpReg, RTMAbortRatio); // allowable range: int16 |
30303 | 2513 |
cmpd(CCR0, R0, tmpReg); |
2514 |
blt(CCR0, L_check_always_rtm1); // jump to reload |
|
2515 |
if (method_data != NULL) { |
|
2516 |
// Set rtm_state to "no rtm" in MDO. |
|
2517 |
// Not using a metadata relocation. Method and Class Loader are kept alive anyway. |
|
2518 |
// (See nmethod::metadata_do and CodeBuffer::finalize_oop_references.) |
|
2519 |
load_const(R0, (address)method_data + MethodData::rtm_state_offset_in_bytes(), tmpReg); |
|
2520 |
atomic_ori_int(R0, tmpReg, NoRTM); |
|
2521 |
} |
|
2522 |
b(L_done); |
|
2523 |
||
2524 |
bind(L_check_always_rtm1); |
|
2525 |
load_const_optimized(rtm_counters_Reg, (address)rtm_counters, R0); // reload |
|
2526 |
bind(L_check_always_rtm2); |
|
2527 |
ld(tmpReg, RTMLockingCounters::total_count_offset(), rtm_counters_Reg); |
|
46494
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2528 |
int64_t thresholdValue = RTMLockingThreshold / RTMTotalCountIncrRate; |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2529 |
if (is_simm(thresholdValue, 16)) { // cmpdi can handle 16bit immediate only. |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2530 |
cmpdi(CCR0, tmpReg, thresholdValue); |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2531 |
} else { |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2532 |
load_const_optimized(R0, thresholdValue); |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2533 |
cmpd(CCR0, tmpReg, R0); |
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2534 |
} |
30303 | 2535 |
blt(CCR0, L_done); |
2536 |
if (method_data != NULL) { |
|
2537 |
// Set rtm_state to "always rtm" in MDO. |
|
2538 |
// Not using a metadata relocation. See above. |
|
2539 |
load_const(R0, (address)method_data + MethodData::rtm_state_offset_in_bytes(), tmpReg); |
|
2540 |
atomic_ori_int(R0, tmpReg, UseRTM); |
|
2541 |
} |
|
2542 |
bind(L_done); |
|
2543 |
} |
|
2544 |
||
2545 |
// Update counters and perform abort ratio calculation. |
|
2546 |
// input: abort_status_Reg |
|
2547 |
void MacroAssembler::rtm_profiling(Register abort_status_Reg, Register temp_Reg, |
|
2548 |
RTMLockingCounters* rtm_counters, |
|
2549 |
Metadata* method_data, |
|
2550 |
bool profile_rtm) { |
|
2551 |
||
2552 |
assert(rtm_counters != NULL, "should not be NULL when profiling RTM"); |
|
2553 |
// Update rtm counters based on state at abort. |
|
2554 |
// Reads abort_status_Reg, updates flags. |
|
2555 |
assert_different_registers(abort_status_Reg, temp_Reg); |
|
2556 |
load_const_optimized(temp_Reg, (address)rtm_counters, R0); |
|
2557 |
rtm_counters_update(abort_status_Reg, temp_Reg); |
|
2558 |
if (profile_rtm) { |
|
2559 |
assert(rtm_counters != NULL, "should not be NULL when profiling RTM"); |
|
2560 |
rtm_abort_ratio_calculation(temp_Reg, rtm_counters, method_data); |
|
2561 |
} |
|
2562 |
} |
|
2563 |
||
2564 |
// Retry on abort if abort's status indicates non-persistent failure. |
|
2565 |
// inputs: retry_count_Reg |
|
2566 |
// : abort_status_Reg |
|
2567 |
// output: retry_count_Reg decremented by 1 |
|
2568 |
void MacroAssembler::rtm_retry_lock_on_abort(Register retry_count_Reg, Register abort_status_Reg, |
|
2569 |
Label& retryLabel, Label* checkRetry) { |
|
2570 |
Label doneRetry; |
|
2571 |
rldicr_(R0, abort_status_Reg, tm_failure_persistent, 0); |
|
2572 |
bne(CCR0, doneRetry); |
|
2573 |
if (checkRetry) { bind(*checkRetry); } |
|
2574 |
addic_(retry_count_Reg, retry_count_Reg, -1); |
|
2575 |
blt(CCR0, doneRetry); |
|
2576 |
b(retryLabel); |
|
2577 |
bind(doneRetry); |
|
2578 |
} |
|
2579 |
||
2580 |
// Spin and retry if lock is busy. |
|
43428
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2581 |
// inputs: owner_addr_Reg (monitor address) |
30303 | 2582 |
// : retry_count_Reg |
2583 |
// output: retry_count_Reg decremented by 1 |
|
2584 |
// CTR is killed |
|
2585 |
void MacroAssembler::rtm_retry_lock_on_busy(Register retry_count_Reg, Register owner_addr_Reg, Label& retryLabel) { |
|
49728
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2586 |
Label SpinLoop, doneRetry, doRetry; |
30303 | 2587 |
addic_(retry_count_Reg, retry_count_Reg, -1); |
2588 |
blt(CCR0, doneRetry); |
|
43428
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2589 |
|
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2590 |
if (RTMSpinLoopCount > 1) { |
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2591 |
li(R0, RTMSpinLoopCount); |
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2592 |
mtctr(R0); |
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2593 |
} |
30303 | 2594 |
|
49728
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2595 |
// low thread priority |
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2596 |
smt_prio_low(); |
30303 | 2597 |
bind(SpinLoop); |
43428
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2598 |
|
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2599 |
if (RTMSpinLoopCount > 1) { |
49728
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2600 |
bdz(doRetry); |
43428
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2601 |
ld(R0, 0, owner_addr_Reg); |
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2602 |
cmpdi(CCR0, R0, 0); |
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2603 |
bne(CCR0, SpinLoop); |
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2604 |
} |
3dccc891c216
8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents:
42661
diff
changeset
|
2605 |
|
49728
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2606 |
bind(doRetry); |
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2607 |
|
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2608 |
// restore thread priority to default in userspace |
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2609 |
#ifdef LINUX |
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2610 |
smt_prio_medium_low(); |
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2611 |
#else |
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2612 |
smt_prio_medium(); |
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2613 |
#endif |
a1617a75c231
8201218: PPC64: Avoid use of yield instruction on spinlock
gromero
parents:
49455
diff
changeset
|
2614 |
|
30303 | 2615 |
b(retryLabel); |
2616 |
||
2617 |
bind(doneRetry); |
|
2618 |
} |
|
2619 |
||
2620 |
// Use RTM for normal stack locks. |
|
2621 |
// Input: objReg (object to lock) |
|
2622 |
void MacroAssembler::rtm_stack_locking(ConditionRegister flag, |
|
2623 |
Register obj, Register mark_word, Register tmp, |
|
2624 |
Register retry_on_abort_count_Reg, |
|
2625 |
RTMLockingCounters* stack_rtm_counters, |
|
2626 |
Metadata* method_data, bool profile_rtm, |
|
2627 |
Label& DONE_LABEL, Label& IsInflated) { |
|
2628 |
assert(UseRTMForStackLocks, "why call this otherwise?"); |
|
2629 |
assert(!UseBiasedLocking, "Biased locking is not supported with RTM locking"); |
|
2630 |
Label L_rtm_retry, L_decrement_retry, L_on_abort; |
|
2631 |
||
2632 |
if (RTMRetryCount > 0) { |
|
2633 |
load_const_optimized(retry_on_abort_count_Reg, RTMRetryCount); // Retry on abort |
|
2634 |
bind(L_rtm_retry); |
|
2635 |
} |
|
2636 |
andi_(R0, mark_word, markOopDesc::monitor_value); // inflated vs stack-locked|neutral|biased |
|
2637 |
bne(CCR0, IsInflated); |
|
2638 |
||
2639 |
if (PrintPreciseRTMLockingStatistics || profile_rtm) { |
|
2640 |
Label L_noincrement; |
|
2641 |
if (RTMTotalCountIncrRate > 1) { |
|
46494
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2642 |
branch_on_random_using_tb(tmp, RTMTotalCountIncrRate, L_noincrement); |
30303 | 2643 |
} |
2644 |
assert(stack_rtm_counters != NULL, "should not be NULL when profiling RTM"); |
|
2645 |
load_const_optimized(tmp, (address)stack_rtm_counters->total_count_addr(), R0); |
|
2646 |
//atomic_inc_ptr(tmp, /*temp, will be reloaded*/mark_word); We don't increment atomically |
|
2647 |
ldx(mark_word, tmp); |
|
2648 |
addi(mark_word, mark_word, 1); |
|
2649 |
stdx(mark_word, tmp); |
|
2650 |
bind(L_noincrement); |
|
2651 |
} |
|
2652 |
tbegin_(); |
|
2653 |
beq(CCR0, L_on_abort); |
|
2654 |
ld(mark_word, oopDesc::mark_offset_in_bytes(), obj); // Reload in transaction, conflicts need to be tracked. |
|
2655 |
andi(R0, mark_word, markOopDesc::biased_lock_mask_in_place); // look at 3 lock bits |
|
2656 |
cmpwi(flag, R0, markOopDesc::unlocked_value); // bits = 001 unlocked |
|
2657 |
beq(flag, DONE_LABEL); // all done if unlocked |
|
2658 |
||
2659 |
if (UseRTMXendForLockBusy) { |
|
2660 |
tend_(); |
|
2661 |
b(L_decrement_retry); |
|
2662 |
} else { |
|
2663 |
tabort_(); |
|
2664 |
} |
|
2665 |
bind(L_on_abort); |
|
2666 |
const Register abort_status_Reg = tmp; |
|
2667 |
mftexasr(abort_status_Reg); |
|
2668 |
if (PrintPreciseRTMLockingStatistics || profile_rtm) { |
|
2669 |
rtm_profiling(abort_status_Reg, /*temp*/mark_word, stack_rtm_counters, method_data, profile_rtm); |
|
2670 |
} |
|
2671 |
ld(mark_word, oopDesc::mark_offset_in_bytes(), obj); // reload |
|
2672 |
if (RTMRetryCount > 0) { |
|
2673 |
// Retry on lock abort if abort status is not permanent. |
|
2674 |
rtm_retry_lock_on_abort(retry_on_abort_count_Reg, abort_status_Reg, L_rtm_retry, &L_decrement_retry); |
|
2675 |
} else { |
|
2676 |
bind(L_decrement_retry); |
|
2677 |
} |
|
2678 |
} |
|
2679 |
||
2680 |
// Use RTM for inflating locks |
|
2681 |
// inputs: obj (object to lock) |
|
2682 |
// mark_word (current header - KILLED) |
|
2683 |
// boxReg (on-stack box address (displaced header location) - KILLED) |
|
2684 |
void MacroAssembler::rtm_inflated_locking(ConditionRegister flag, |
|
2685 |
Register obj, Register mark_word, Register boxReg, |
|
2686 |
Register retry_on_busy_count_Reg, Register retry_on_abort_count_Reg, |
|
2687 |
RTMLockingCounters* rtm_counters, |
|
2688 |
Metadata* method_data, bool profile_rtm, |
|
2689 |
Label& DONE_LABEL) { |
|
2690 |
assert(UseRTMLocking, "why call this otherwise?"); |
|
2691 |
Label L_rtm_retry, L_decrement_retry, L_on_abort; |
|
2692 |
// Clean monitor_value bit to get valid pointer. |
|
2693 |
int owner_offset = ObjectMonitor::owner_offset_in_bytes() - markOopDesc::monitor_value; |
|
2694 |
||
2695 |
// Store non-null, using boxReg instead of (intptr_t)markOopDesc::unused_mark(). |
|
2696 |
std(boxReg, BasicLock::displaced_header_offset_in_bytes(), boxReg); |
|
2697 |
const Register tmpReg = boxReg; |
|
2698 |
const Register owner_addr_Reg = mark_word; |
|
2699 |
addi(owner_addr_Reg, mark_word, owner_offset); |
|
2700 |
||
2701 |
if (RTMRetryCount > 0) { |
|
2702 |
load_const_optimized(retry_on_busy_count_Reg, RTMRetryCount); // Retry on lock busy. |
|
2703 |
load_const_optimized(retry_on_abort_count_Reg, RTMRetryCount); // Retry on abort. |
|
2704 |
bind(L_rtm_retry); |
|
2705 |
} |
|
2706 |
if (PrintPreciseRTMLockingStatistics || profile_rtm) { |
|
2707 |
Label L_noincrement; |
|
2708 |
if (RTMTotalCountIncrRate > 1) { |
|
46494
3fdd343bc5ea
8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents:
46369
diff
changeset
|
2709 |
branch_on_random_using_tb(R0, RTMTotalCountIncrRate, L_noincrement); |
30303 | 2710 |
} |
2711 |
assert(rtm_counters != NULL, "should not be NULL when profiling RTM"); |
|
2712 |
load_const(R0, (address)rtm_counters->total_count_addr(), tmpReg); |
|
2713 |
//atomic_inc_ptr(R0, tmpReg); We don't increment atomically |
|
2714 |
ldx(tmpReg, R0); |
|
2715 |
addi(tmpReg, tmpReg, 1); |
|
2716 |
stdx(tmpReg, R0); |
|
2717 |
bind(L_noincrement); |
|
2718 |
} |
|
2719 |
tbegin_(); |
|
2720 |
beq(CCR0, L_on_abort); |
|
2721 |
// We don't reload mark word. Will only be reset at safepoint. |
|
2722 |
ld(R0, 0, owner_addr_Reg); // Load in transaction, conflicts need to be tracked. |
|
2723 |
cmpdi(flag, R0, 0); |
|
2724 |
beq(flag, DONE_LABEL); |
|
2725 |
||
2726 |
if (UseRTMXendForLockBusy) { |
|
2727 |
tend_(); |
|
2728 |
b(L_decrement_retry); |
|
2729 |
} else { |
|
2730 |
tabort_(); |
|
2731 |
} |
|
2732 |
bind(L_on_abort); |
|
2733 |
const Register abort_status_Reg = tmpReg; |
|
2734 |
mftexasr(abort_status_Reg); |
|
2735 |
if (PrintPreciseRTMLockingStatistics || profile_rtm) { |
|
2736 |
rtm_profiling(abort_status_Reg, /*temp*/ owner_addr_Reg, rtm_counters, method_data, profile_rtm); |
|
2737 |
// Restore owner_addr_Reg |
|
2738 |
ld(mark_word, oopDesc::mark_offset_in_bytes(), obj); |
|
2739 |
#ifdef ASSERT |
|
2740 |
andi_(R0, mark_word, markOopDesc::monitor_value); |
|
2741 |
asm_assert_ne("must be inflated", 0xa754); // Deflating only allowed at safepoint. |
|
2742 |
#endif |
|
2743 |
addi(owner_addr_Reg, mark_word, owner_offset); |
|
2744 |
} |
|
2745 |
if (RTMRetryCount > 0) { |
|
2746 |
// Retry on lock abort if abort status is not permanent. |
|
2747 |
rtm_retry_lock_on_abort(retry_on_abort_count_Reg, abort_status_Reg, L_rtm_retry); |
|
2748 |
} |
|
2749 |
||
2750 |
// Appears unlocked - try to swing _owner from null to non-null. |
|
2751 |
cmpxchgd(flag, /*current val*/ R0, (intptr_t)0, /*new val*/ R16_thread, owner_addr_Reg, |
|
2752 |
MacroAssembler::MemBarRel | MacroAssembler::MemBarAcq, |
|
2753 |
MacroAssembler::cmpxchgx_hint_acquire_lock(), noreg, &L_decrement_retry, true); |
|
2754 |
||
2755 |
if (RTMRetryCount > 0) { |
|
2756 |
// success done else retry |
|
2757 |
b(DONE_LABEL); |
|
2758 |
bind(L_decrement_retry); |
|
2759 |
// Spin and retry if lock is busy. |
|
2760 |
rtm_retry_lock_on_busy(retry_on_busy_count_Reg, owner_addr_Reg, L_rtm_retry); |
|
2761 |
} else { |
|
2762 |
bind(L_decrement_retry); |
|
2763 |
} |
|
2764 |
} |
|
2765 |
||
2766 |
#endif // INCLUDE_RTM_OPT |
|
2767 |
||
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2768 |
// "The box" is the space on the stack where we copy the object mark. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2769 |
// Emits the fast path for locking `oop` using the BasicLock at `box`.
//
// The outcome is reported in `flag` at the `cont` label:
//   flag == EQ indicates success
//   flag == NE indicates failure
//
// Registers: `oop`, `box`, `temp`, `displaced_header` and `current_header` must
// all be distinct. `temp`, `displaced_header` and `current_header` are
// overwritten, and R0 is written as well. `flag` must not be CCR0 because CCR0
// is used for the intermediate tests below.
//
// try_bias:  if set, biased_locking_enter() is emitted first.
// use_rtm, profile_rtm, rtm_counters, stack_rtm_counters, method_data:
//            only referenced when INCLUDE_RTM_OPT is set; they are forwarded
//            to rtm_stack_locking() / rtm_inflated_locking().
void MacroAssembler::compiler_fast_lock_object(ConditionRegister flag, Register oop, Register box,
                                               Register temp, Register displaced_header, Register current_header,
                                               bool try_bias,
                                               RTMLockingCounters* rtm_counters,
                                               RTMLockingCounters* stack_rtm_counters,
                                               Metadata* method_data,
                                               bool use_rtm, bool profile_rtm) {
  assert_different_registers(oop, box, temp, displaced_header, current_header);
  assert(flag != CCR0, "bad condition register");
  Label cont;                // Common exit; flag holds the result.
  Label object_has_monitor;  // Mark word has monitor_value set.
  Label cas_failed;          // Mark word CAS did not succeed.

  // Load markOop from object into displaced_header.
  ld(displaced_header, oopDesc::mark_offset_in_bytes(), oop);


  // Always do locking in runtime.
  if (EmitSync & 0x01) {
    cmpdi(flag, oop, 0); // Oop can't be 0 here => always false, i.e. flag == NE (failure).
    return;
  }

  if (try_bias) {
    // biased_locking_enter() is handed `cont` as its exit label.
    biased_locking_enter(flag, oop, displaced_header, temp, current_header, cont);
  }

#if INCLUDE_RTM_OPT
  if (UseRTMForStackLocks && use_rtm) {
    // The helper is handed both `cont` and `object_has_monitor` as branch targets.
    rtm_stack_locking(flag, oop, displaced_header, temp, /*temp*/ current_header,
                      stack_rtm_counters, method_data, profile_rtm,
                      cont, object_has_monitor);
  }
#endif // INCLUDE_RTM_OPT

  // Handle existing monitor.
  if ((EmitSync & 0x02) == 0) {
    // The object has an existing monitor iff (mark & monitor_value) != 0.
    // The result of andi_ is tested through CCR0 by the branch that follows.
    andi_(temp, displaced_header, markOopDesc::monitor_value);
    bne(CCR0, object_has_monitor);
  }

  // Set displaced_header to be (markOop of object | UNLOCK_VALUE).
  ori(displaced_header, displaced_header, markOopDesc::unlocked_value);

  // NOTE(review): the original comment here read "Load Compare Value application
  // register." but no instruction follows it; it looks like a leftover.

  // Initialize the box. (Must happen before we update the object mark!)
  std(displaced_header, BasicLock::displaced_header_offset_in_bytes(), box);

  // The store to the box above must not float below the cmpxchg. No separate
  // fence is emitted here; cmpxchgd is asked for MemBarRel | MemBarAcq instead
  // (presumably that provides the required ordering -- TODO confirm).
  // Compare the object's markOop with displaced_header and, if equal, replace it
  // with box. On failure control continues at cas_failed.
  cmpxchgd(/*flag=*/flag,
           /*current_value=*/current_header,
           /*compare_value=*/displaced_header,
           /*exchange_value=*/box,
           /*where=*/oop,
           MacroAssembler::MemBarRel | MacroAssembler::MemBarAcq,
           MacroAssembler::cmpxchgx_hint_acquire_lock(),
           noreg,
           &cas_failed,
           /*check without membar and ldarx first*/true);
  // `oop` is used directly as the CAS address, which requires the mark at offset 0.
  assert(oopDesc::mark_offset_in_bytes() == 0, "offset of _mark is not 0");

  // If the compare-and-exchange succeeded, then we found an unlocked
  // object and we have now locked it.
  b(cont);

  bind(cas_failed);
  // We did not see an unlocked object so try the fast recursive case.

  // Check if the owner is self by comparing the value in the markOop of object
  // (current_header) with the stack pointer: compute (mark - SP) and mask it
  // with ~(page_size-1) | lock_mask_in_place.
  sub(current_header, current_header, R1_SP);
  load_const_optimized(temp, ~(os::vm_page_size()-1) | markOopDesc::lock_mask_in_place);

  and_(R0/*==0?*/, current_header, temp);
  // If the masked value is 0 the lock is recursive: flag becomes EQ (copied
  // from CCR0) and the 0 in R0 is stored as the displaced header in the box,
  // which indicates that it is a recursive lock. Otherwise flag is NE and a
  // non-zero value is stored.
  mcrf(flag,CCR0);
  std(R0/*==0, perhaps*/, BasicLock::displaced_header_offset_in_bytes(), box);

  // Handle existing monitor.
  if ((EmitSync & 0x02) == 0) {
    // The stack-lock paths above are done; skip over the monitor code.
    b(cont);

    bind(object_has_monitor);
    // The object's monitor m is unlocked iff m->owner == NULL,
    // otherwise m->owner may contain a thread or a stack address.

#if INCLUDE_RTM_OPT
    // Use the same RTM locking code in 32- and 64-bit VM.
    if (use_rtm) {
      rtm_inflated_locking(flag, oop, displaced_header, box, temp, /*temp*/ current_header,
                           rtm_counters, method_data, profile_rtm, cont);
    } else {
#endif // INCLUDE_RTM_OPT

    // Try to CAS m->owner from NULL to current thread.
    // temp = address of m->owner: displaced_header holds the mark word, from
    // which monitor_value is subtracted and the owner offset added.
    addi(temp, displaced_header, ObjectMonitor::owner_offset_in_bytes()-markOopDesc::monitor_value);
    cmpxchgd(/*flag=*/flag,
             /*current_value=*/current_header,
             /*compare_value=*/(intptr_t)0,
             /*exchange_value=*/R16_thread,
             /*where=*/temp,
             MacroAssembler::MemBarRel | MacroAssembler::MemBarAcq,
             MacroAssembler::cmpxchgx_hint_acquire_lock());

    // Store a non-null value into the box (the box address itself is used).
    std(box, BasicLock::displaced_header_offset_in_bytes(), box);

#   ifdef ASSERT
    // Debug builds only: skip the checks if the CAS above failed.
    bne(flag, cont);
    // We have acquired the monitor, check some invariants.
    addi(/*monitor=*/temp, temp, -ObjectMonitor::owner_offset_in_bytes());
    // Invariant 1: _recursions should be 0.
    //assert(ObjectMonitor::recursions_size_in_bytes() == 8, "unexpected size");
    asm_assert_mem8_is_zero(ObjectMonitor::recursions_offset_in_bytes(), temp,
                            "monitor->_recursions should be 0", -1);
#   endif

#if INCLUDE_RTM_OPT
    } // use_rtm()
#endif
  }

  bind(cont);
  // flag == EQ indicates success
  // flag == NE indicates failure
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2899 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
2900 |
// Emits the fast path for unlocking `oop` whose BasicLock is at `box`.
//
// The outcome is reported in `flag` at the `cont` label:
//   flag == EQ indicates success
//   flag == NE indicates failure
//
// Registers: `oop`, `box`, `temp`, `displaced_header` and `current_header` must
// all be distinct. `temp`, `displaced_header` and `current_header` are
// overwritten, and R0 is written as well. `flag` must not be CCR0 because CCR0
// is used for the monitor test below.
//
// try_bias:  if set, biased_locking_exit() is emitted first.
// use_rtm:   only referenced when INCLUDE_RTM_OPT is set.
void MacroAssembler::compiler_fast_unlock_object(ConditionRegister flag, Register oop, Register box,
                                                 Register temp, Register displaced_header, Register current_header,
                                                 bool try_bias, bool use_rtm) {
  assert_different_registers(oop, box, temp, displaced_header, current_header);
  assert(flag != CCR0, "bad condition register");
  Label cont;                // Common exit; flag holds the result.
  Label object_has_monitor;  // Mark word has monitor_value set.

  // Always do locking in runtime.
  if (EmitSync & 0x01) {
    cmpdi(flag, oop, 0); // Oop can't be 0 here => always false, i.e. flag == NE (failure).
    return;
  }

  if (try_bias) {
    // biased_locking_exit() is handed `cont` as its exit label.
    biased_locking_exit(flag, oop, current_header, cont);
  }

#if INCLUDE_RTM_OPT
  if (UseRTMForStackLocks && use_rtm) {
    assert(!UseBiasedLocking, "Biased locking is not supported with RTM locking");
    Label L_regular_unlock;
    ld(current_header, oopDesc::mark_offset_in_bytes(), oop);         // fetch markword
    andi(R0, current_header, markOopDesc::biased_lock_mask_in_place); // look at 3 lock bits
    cmpwi(flag, R0, markOopDesc::unlocked_value);                     // bits = 001 unlocked
    bne(flag, L_regular_unlock);                                      // else RegularLock
    tend_();                                                          // otherwise end...
    b(cont);                                                          // ... and we're done (flag == EQ from the cmpwi)
    bind(L_regular_unlock);
  }
#endif

  // Find the lock address and load the displaced header from the stack.
  ld(displaced_header, BasicLock::displaced_header_offset_in_bytes(), box);

  // If the displaced header is 0, we have a recursive unlock.
  // The branch is taken with flag == EQ, so this case reports success.
  cmpdi(flag, displaced_header, 0);
  beq(flag, cont);

  // Handle existing monitor.
  if ((EmitSync & 0x02) == 0) {
    // The object has an existing monitor iff (mark & monitor_value) != 0.
    // With RTM stack locking, the mark word was already loaded into
    // current_header above, so the macro below makes the following ld
    // conditional (generator-time `if`) on that not being the case.
    RTM_OPT_ONLY( if (!(UseRTMForStackLocks && use_rtm)) ) // skip load if already done
    ld(current_header, oopDesc::mark_offset_in_bytes(), oop);
    // The result of andi_ is tested through CCR0 by the branch that follows.
    andi_(R0, current_header, markOopDesc::monitor_value);
    bne(CCR0, object_has_monitor);
  }

  // Check if it is still a lightweight lock; this is true if we see
  // the stack address of the basicLock in the markOop of the object.
  // If so, the displaced header is written back into the markOop.
  // Cmpxchg sets flag to cmpd(current_header, box).
  cmpxchgd(/*flag=*/flag,
           /*current_value=*/current_header,
           /*compare_value=*/box,
           /*exchange_value=*/displaced_header,
           /*where=*/oop,
           MacroAssembler::MemBarRel,
           MacroAssembler::cmpxchgx_hint_release_lock(),
           noreg,
           &cont);

  // `oop` is used directly as the CAS address, which requires the mark at offset 0.
  assert(oopDesc::mark_offset_in_bytes() == 0, "offset of _mark is not 0");

  // Handle existing monitor.
  if ((EmitSync & 0x02) == 0) {
    // The stack-lock path above is done; skip over the monitor code.
    b(cont);

    bind(object_has_monitor);
    // Clear the monitor_value bit so current_header is the monitor pointer,
    // then load the monitor's owner field into temp.
    addi(current_header, current_header, -markOopDesc::monitor_value); // monitor
    ld(temp,             ObjectMonitor::owner_offset_in_bytes(), current_header);

    // It's inflated.
#if INCLUDE_RTM_OPT
    if (use_rtm) {
      Label L_regular_inflated_unlock;
      // If the owner field loaded into temp is 0, end the transaction and
      // finish (flag == EQ from the cmpdi); otherwise do the regular
      // inflated unlock below.
      cmpdi(flag, temp, 0);
      bne(flag, L_regular_inflated_unlock);
      tend_();
      b(cont);
      bind(L_regular_inflated_unlock);
    }
#endif

    // Give up (flag == NE) unless we are the owner and there are no recursions.
    ld(displaced_header, ObjectMonitor::recursions_offset_in_bytes(), current_header);
    xorr(temp, R16_thread, temp);      // Will be 0 if we are the owner.
    orr(temp, temp, displaced_header); // Will be 0 if there are 0 recursions.
    cmpdi(flag, temp, 0);
    bne(flag, cont);

    // Give up (flag == NE) unless both EntryList and cxq are 0.
    ld(temp,             ObjectMonitor::EntryList_offset_in_bytes(), current_header);
    ld(displaced_header, ObjectMonitor::cxq_offset_in_bytes(), current_header);
    orr(temp, temp, displaced_header); // Will be 0 if both are 0.
    cmpdi(flag, temp, 0);
    bne(flag, cont);
    // temp is known to be 0 here (the branch above was not taken), so this
    // stores 0 into the owner field, after a release barrier. flag is EQ.
    release();
    std(temp,            ObjectMonitor::owner_offset_in_bytes(), current_header);
  }

  bind(cont);
  // flag == EQ indicates success
  // flag == NE indicates failure
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3003 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3004 |
// Write serialization page so VM thread can do a pseudo remote membar. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3005 |
// We use the current thread pointer to calculate a thread specific |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3006 |
// offset to write to within the page. This minimizes bus traffic |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3007 |
// due to cache line collision. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3008 |
void MacroAssembler::serialize_memory(Register thread, Register tmp1, Register tmp2) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3009 |
srdi(tmp2, thread, os::get_serialize_page_shift_count()); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3010 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3011 |
int mask = os::vm_page_size() - sizeof(int); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3012 |
if (Assembler::is_simm(mask, 16)) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3013 |
andi(tmp2, tmp2, mask); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3014 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3015 |
lis(tmp1, (int)((signed short) (mask >> 16))); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3016 |
ori(tmp1, tmp1, mask & 0x0000ffff); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3017 |
andr(tmp2, tmp2, tmp1); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3018 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3019 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3020 |
load_const(tmp1, (long) os::get_memory_serialize_page()); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3021 |
release(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3022 |
stwx(R0, tmp1, tmp2); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3023 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3024 |
|
48332
651a95f30dfb
8193257: PPC64, s390 implementation for Thread-local handshakes
mdoerr
parents:
47580
diff
changeset
|
3025 |
// Emits a safepoint poll that branches to `slow_path` when the poll fires.
//
// slow_path: label taken when CCR0 is NE after the check below.
// temp_reg:  scratch register; overwritten by the poll.
//
// CCR0 is used for the comparison in both variants.
void MacroAssembler::safepoint_poll(Label& slow_path, Register temp_reg) {
  if (!SafepointMechanism::uses_thread_local_poll()) {
    // Global poll: load the safepoint state word and compare it against
    // _not_synchronized.
    lwz(temp_reg, (RegisterOrConstant)(intptr_t)SafepointSynchronize::address_of_state());
    cmpwi(CCR0, temp_reg, SafepointSynchronize::_not_synchronized);
  } else {
    // Thread-local poll: load this thread's polling page value and isolate
    // the poll bit. An armed page has the poll bit set.
    ld(temp_reg, in_bytes(Thread::polling_page_offset()), R16_thread);
    andi_(temp_reg, temp_reg, SafepointMechanism::poll_bit());
  }

  // Either check leaves NE in CCR0 when the slow path is required.
  bne(CCR0, slow_path);
}
651a95f30dfb
8193257: PPC64, s390 implementation for Thread-local handshakes
mdoerr
parents:
47580
diff
changeset
|
3036 |
|
44406
a46a6c4d1dd9
8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents:
44093
diff
changeset
|
3037 |
// Resolves the jobject held in 'value' by forwarding to the
// BarrierSetAssembler of the active barrier set, which emits the
// GC-specific code. tmp1, tmp2 and needs_frame are passed through unchanged.
void MacroAssembler::resolve_jobject(Register value, Register tmp1, Register tmp2, bool needs_frame) {
  BarrierSet::barrier_set()->barrier_set_assembler()
      ->resolve_jobject(this, value, tmp1, tmp2, needs_frame);
}
a46a6c4d1dd9
8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents:
44093
diff
changeset
|
3041 |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3042 |
// Values for last_Java_pc, and last_Java_sp must comply to the rules |
27012 | 3043 |
// in frame_ppc.hpp. |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3044 |
void MacroAssembler::set_last_Java_frame(Register last_Java_sp, Register last_Java_pc) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3045 |
// Always set last_Java_pc and flags first because once last_Java_sp |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3046 |
// is visible has_last_Java_frame is true and users will look at the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3047 |
// rest of the fields. (Note: flags should always be zero before we |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3048 |
// get here so doesn't need to be set.) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3049 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3050 |
// Verify that last_Java_pc was zeroed on return to Java |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3051 |
asm_assert_mem8_is_zero(in_bytes(JavaThread::last_Java_pc_offset()), R16_thread, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3052 |
"last_Java_pc not zeroed before leaving Java", 0x200); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3053 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3054 |
// When returning from calling out from Java mode the frame anchor's |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3055 |
// last_Java_pc will always be set to NULL. It is set here so that |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3056 |
// if we are doing a call to native (not VM) that we capture the |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3057 |
// known pc and don't have to rely on the native call having a |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3058 |
// standard frame linkage where we can find the pc. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3059 |
if (last_Java_pc != noreg) |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3060 |
std(last_Java_pc, in_bytes(JavaThread::last_Java_pc_offset()), R16_thread); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3061 |
|
22861 | 3062 |
// Set last_Java_sp last. |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3063 |
std(last_Java_sp, in_bytes(JavaThread::last_Java_sp_offset()), R16_thread); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3064 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3065 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3066 |
void MacroAssembler::reset_last_Java_frame(void) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3067 |
asm_assert_mem8_isnot_zero(in_bytes(JavaThread::last_Java_sp_offset()), |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3068 |
R16_thread, "SP was not set, still zero", 0x202); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3069 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3070 |
BLOCK_COMMENT("reset_last_Java_frame {"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3071 |
li(R0, 0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3072 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3073 |
// _last_Java_sp = 0 |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3074 |
std(R0, in_bytes(JavaThread::last_Java_sp_offset()), R16_thread); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3075 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3076 |
// _last_Java_pc = 0 |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3077 |
std(R0, in_bytes(JavaThread::last_Java_pc_offset()), R16_thread); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3078 |
BLOCK_COMMENT("} reset_last_Java_frame"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3079 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3080 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3081 |
// Records 'sp' as last_Java_sp together with a pc materialized in tmp1.
// The pc stored is the assembler's current emission address (pc()), loaded
// as a constant. sp and tmp1 must be different registers; tmp1 is
// overwritten.
void MacroAssembler::set_top_ijava_frame_at_SP_as_last_Java_frame(Register sp, Register tmp1) {
  assert_different_registers(sp, tmp1);

  // sp is expected to point to a TOP_IJAVA_FRAME.
  // FIXME: assert that we really have a TOP_IJAVA_FRAME here!
  address anchor_pc = pc();
  load_const_optimized(tmp1, anchor_pc);

  set_last_Java_frame(/*sp=*/sp, /*pc=*/tmp1);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3092 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3093 |
// Fetches the thread's vm_result into oop_result and clears the field.
//
// Reads:   R16_thread, R16_thread->vm_result
// Updates: oop_result, R16_thread->vm_result (set to zero)
// Scratch: R0
void MacroAssembler::get_vm_result(Register oop_result) {
  const int vm_result_offset = in_bytes(JavaThread::vm_result_offset());

  verify_thread();

  ld(oop_result, vm_result_offset, R16_thread);
  li(R0, 0);
  std(R0, vm_result_offset, R16_thread);

  verify_oop(oop_result);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3110 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3111 |
// Fetches the thread's vm_result_2 into metadata_result and clears the field.
//
// Reads:   R16_thread, R16_thread->vm_result_2
// Updates: metadata_result, R16_thread->vm_result_2 (set to zero)
// Scratch: R0
void MacroAssembler::get_vm_result_2(Register metadata_result) {
  const int vm_result_2_offset = in_bytes(JavaThread::vm_result_2_offset());

  ld(metadata_result, vm_result_2_offset, R16_thread);
  li(R0, 0);
  std(R0, vm_result_2_offset, R16_thread);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3124 |
|
30303 | 3125 |
// Emits code that compresses a Klass pointer: subtracts the narrow klass
// base (if non-zero) and shifts right by the narrow klass shift (if non-zero).
//   dst - receives the result whenever any instruction is emitted.
//   src - register holding the Klass, or noreg if the Klass is in dst.
// Returns the register that finally holds the encoded value: dst if at
// least one step was emitted, otherwise the unchanged input register.
// R0 is handed to sub_const_optimized as temp.
Register MacroAssembler::encode_klass_not_null(Register dst, Register src) {
  // Without an explicit src the Klass lives in dst.
  Register klass_reg = dst;
  if (src != noreg) {
    klass_reg = src;
  }

  if (Universe::narrow_klass_base() != 0) {
    // dst serves as the destination of the subtraction.
    sub_const_optimized(dst, klass_reg, Universe::narrow_klass_base(), R0);
    klass_reg = dst;
  }

  if (Universe::narrow_klass_shift() != 0) {
    srdi(dst, klass_reg, Universe::narrow_klass_shift());
    klass_reg = dst;
  }

  return klass_reg;
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3138 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3139 |
// Stores 'klass' into the klass field of the object at dst_oop.
// With UseCompressedClassPointers the Klass is encoded first (ck is passed
// as destination register of the encoding) and stored as a 32-bit word;
// otherwise the full 64-bit pointer is stored.
void MacroAssembler::store_klass(Register dst_oop, Register klass, Register ck) {
  if (!UseCompressedClassPointers) {
    std(klass, oopDesc::klass_offset_in_bytes(), dst_oop);
    return;
  }

  Register narrow_klass = encode_klass_not_null(ck, klass);
  stw(narrow_klass, oopDesc::klass_offset_in_bytes(), dst_oop);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3147 |
|
23221 | 3148 |
// Writes the 32-bit klass gap of the object at dst_oop. Emits nothing unless
// UseCompressedClassPointers is set. If val is noreg, zero is stored and R0
// is used to hold it.
void MacroAssembler::store_klass_gap(Register dst_oop, Register val) {
  if (!UseCompressedClassPointers) {
    return;  // No gap to fill.
  }

  if (val == noreg) {
    val = R0;
    li(val, 0);
  }
  stw(val, oopDesc::klass_gap_offset_in_bytes(), dst_oop); // klass gap if compressed
}
|
3157 |
||
22843
b245fac3b6a4
8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents:
22840
diff
changeset
|
3158 |
int MacroAssembler::instr_size_for_decode_klass_not_null() { |
b245fac3b6a4
8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents:
22840
diff
changeset
|
3159 |
if (!UseCompressedClassPointers) return 0; |
b245fac3b6a4
8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents:
22840
diff
changeset
|
3160 |
int num_instrs = 1; // shift or move |
b245fac3b6a4
8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents:
22840
diff
changeset
|
3161 |
if (Universe::narrow_klass_base() != 0) num_instrs = 7; // shift + load const + add |
b245fac3b6a4
8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents:
22840
diff
changeset
|
3162 |
return num_instrs * BytesPerInstWord; |
b245fac3b6a4
8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents:
22840
diff
changeset
|
3163 |
} |
b245fac3b6a4
8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents:
22840
diff
changeset
|
3164 |
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3165 |
// Emits code that expands a compressed Klass pointer: shifts left by the
// narrow klass shift and adds the narrow klass base (each only if non-zero).
//   dst - receives the decoded Klass; must not be R0 because R0 is handed to
//         add_const_optimized as temp.
//   src - register holding the narrow Klass, or noreg if it is in dst.
void MacroAssembler::decode_klass_not_null(Register dst, Register src) {
  assert(dst != R0, "Dst reg may not be R0, as R0 is used here.");
  if (src == noreg) {
    src = dst;
  }

  const bool has_shift = (Universe::narrow_klass_shift() != 0);
  const bool has_base  = (Universe::narrow_klass_base() != 0);
  // Without a base there is no add that could transfer src to dst, so the
  // shift instruction has to do the move.
  const bool move_required = !has_base && (src != dst);

  Register shifted_src = src;
  if (has_shift || move_required) {
    shifted_src = dst;
    sldi(shifted_src, src, Universe::narrow_klass_shift());
  }

  if (has_base) {
    add_const_optimized(dst, shifted_src, Universe::narrow_klass_base(), R0);
  }
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3178 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3179 |
// Loads the Klass of the object at 'src' into 'dst'. With
// UseCompressedClassPointers the 32-bit field is loaded and decoded in
// place; otherwise the 64-bit pointer is loaded directly.
// The object reference is not checked for null.
void MacroAssembler::load_klass(Register dst, Register src) {
  if (!UseCompressedClassPointers) {
    ld(dst, oopDesc::klass_offset_in_bytes(), src);
    return;
  }

  lwz(dst, oopDesc::klass_offset_in_bytes(), src);
  // Attention: no null check here!
  decode_klass_not_null(dst, dst);
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3188 |
|
46961
c9094b1e5f87
8186088: ConstantPoolCache::_resolved_references is not a JNIHandle
coleenp
parents:
46789
diff
changeset
|
3189 |
// ((OopHandle)result).resolve(); |
c9094b1e5f87
8186088: ConstantPoolCache::_resolved_references is not a JNIHandle
coleenp
parents:
46789
diff
changeset
|
3190 |
void MacroAssembler::resolve_oop_handle(Register result) { |
c9094b1e5f87
8186088: ConstantPoolCache::_resolved_references is not a JNIHandle
coleenp
parents:
46789
diff
changeset
|
3191 |
// OopHandle::resolve is an indirection. |
c9094b1e5f87
8186088: ConstantPoolCache::_resolved_references is not a JNIHandle
coleenp
parents:
46789
diff
changeset
|
3192 |
ld(result, 0, result); |
c9094b1e5f87
8186088: ConstantPoolCache::_resolved_references is not a JNIHandle
coleenp
parents:
46789
diff
changeset
|
3193 |
} |
c9094b1e5f87
8186088: ConstantPoolCache::_resolved_references is not a JNIHandle
coleenp
parents:
46789
diff
changeset
|
3194 |
|
42068
18c8a4d5998e
8168083: PPC64: Cleanup template interpreter after 8154580 and 8154867
mdoerr
parents:
41334
diff
changeset
|
3195 |
// Loads the java mirror reachable from a ConstMethod into 'mirror' by
// following const_method -> constants -> pool holder -> java_mirror handle
// and resolving that handle. 'mirror' also serves as the intermediate
// register of the chain; const_method is only read.
void MacroAssembler::load_mirror_from_const_method(Register mirror, Register const_method) {
  const int constants_off   = in_bytes(ConstMethod::constants_offset());
  const int pool_holder_off = ConstantPool::pool_holder_offset_in_bytes();
  const int java_mirror_off = in_bytes(Klass::java_mirror_offset());

  ld(mirror, constants_off, const_method);  // constant pool
  ld(mirror, pool_holder_off, mirror);      // pool holder
  ld(mirror, java_mirror_off, mirror);      // mirror handle
  resolve_oop_handle(mirror);
}
8475fdc6dcc3
8154580: Save mirror in interpreter frame to enable cleanups of CLDClosure
coleenp
parents:
36303
diff
changeset
|
3201 |
|
22861 | 3202 |
// Clear Array |
42661
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3203 |
// For very short arrays. tmp == R0 is allowed. |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3204 |
void MacroAssembler::clear_memory_unrolled(Register base_ptr, int cnt_dwords, Register tmp, int offset) { |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3205 |
if (cnt_dwords > 0) { li(tmp, 0); } |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3206 |
for (int i = 0; i < cnt_dwords; ++i) { std(tmp, offset + i * 8, base_ptr); } |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3207 |
} |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3208 |
|
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3209 |
// Version for constant short array length. Kills base_ptr. tmp == R0 is allowed. |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3210 |
void MacroAssembler::clear_memory_constlen(Register base_ptr, int cnt_dwords, Register tmp) { |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3211 |
if (cnt_dwords < 8) { |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3212 |
clear_memory_unrolled(base_ptr, cnt_dwords, tmp); |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3213 |
return; |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3214 |
} |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3215 |
|
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3216 |
Label loop; |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3217 |
const long loopcnt = cnt_dwords >> 1, |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3218 |
remainder = cnt_dwords & 1; |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3219 |
|
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3220 |
li(tmp, loopcnt); |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3221 |
mtctr(tmp); |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3222 |
li(tmp, 0); |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3223 |
bind(loop); |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3224 |
std(tmp, 0, base_ptr); |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3225 |
std(tmp, 8, base_ptr); |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3226 |
addi(base_ptr, base_ptr, 16); |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3227 |
bdnz(loop); |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3228 |
if (remainder) { std(tmp, 0, base_ptr); } |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3229 |
} |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3230 |
|
22861 | 3231 |
// Kills both input registers. tmp == R0 is allowed. |
42661
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3232 |
void MacroAssembler::clear_memory_doubleword(Register base_ptr, Register cnt_dwords, Register tmp, long const_cnt) { |
22861 | 3233 |
// Procedure for large arrays (uses data cache block zero instruction). |
3234 |
Label startloop, fast, fastloop, small_rest, restloop, done; |
|
35085 | 3235 |
const int cl_size = VM_Version::L1_data_cache_line_size(), |
42661
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3236 |
cl_dwords = cl_size >> 3, |
22861 | 3237 |
cl_dw_addr_bits = exact_log2(cl_dwords), |
42661
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3238 |
dcbz_min = 1, // Min count of dcbz executions, needs to be >0. |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3239 |
min_cnt = ((dcbz_min + 1) << cl_dw_addr_bits) - 1; |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3240 |
|
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3241 |
if (const_cnt >= 0) { |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3242 |
// Constant case. |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3243 |
if (const_cnt < min_cnt) { |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3244 |
clear_memory_constlen(base_ptr, const_cnt, tmp); |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3245 |
return; |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3246 |
} |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3247 |
load_const_optimized(cnt_dwords, const_cnt, tmp); |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3248 |
} else { |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3249 |
// cnt_dwords already loaded in register. Need to check size. |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3250 |
cmpdi(CCR1, cnt_dwords, min_cnt); // Big enough? (ensure >= dcbz_min lines included). |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3251 |
blt(CCR1, small_rest); |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3252 |
} |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3253 |
rldicl_(tmp, base_ptr, 64-3, 64-cl_dw_addr_bits); // Extract dword offset within first cache line. |
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3254 |
beq(CCR0, fast); // Already 128byte aligned. |
22861 | 3255 |
|
3256 |
subfic(tmp, tmp, cl_dwords); |
|
3257 |
mtctr(tmp); // Set ctr to hit 128byte boundary (0<ctr<cl_dwords). |
|
3258 |
subf(cnt_dwords, tmp, cnt_dwords); // rest. |
|
3259 |
li(tmp, 0); |
|
42661
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3260 |
|
22861 | 3261 |
bind(startloop); // Clear at the beginning to reach 128byte boundary. |
3262 |
std(tmp, 0, base_ptr); // Clear 8byte aligned block. |
|
3263 |
addi(base_ptr, base_ptr, 8); |
|
3264 |
bdnz(startloop); |
|
42661
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3265 |
|
22861 | 3266 |
bind(fast); // Clear 128byte blocks. |
3267 |
srdi(tmp, cnt_dwords, cl_dw_addr_bits); // Loop count for 128byte loop (>0). |
|
3268 |
andi(cnt_dwords, cnt_dwords, cl_dwords-1); // Rest in dwords. |
|
3269 |
mtctr(tmp); // Load counter. |
|
42661
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3270 |
|
22861 | 3271 |
bind(fastloop); |
3272 |
dcbz(base_ptr); // Clear 128byte aligned block. |
|
3273 |
addi(base_ptr, base_ptr, cl_size); |
|
3274 |
bdnz(fastloop); |
|
42661
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3275 |
|
22861 | 3276 |
bind(small_rest); |
3277 |
cmpdi(CCR0, cnt_dwords, 0); // size 0? |
|
3278 |
beq(CCR0, done); // rest == 0 |
|
3279 |
li(tmp, 0); |
|
3280 |
mtctr(cnt_dwords); // Load counter. |
|
42661
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3281 |
|
22861 | 3282 |
bind(restloop); // Clear rest. |
3283 |
std(tmp, 0, base_ptr); // Clear 8byte aligned block. |
|
3284 |
addi(base_ptr, base_ptr, 8); |
|
3285 |
bdnz(restloop); |
|
42661
2343dd675325
8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents:
42068
diff
changeset
|
3286 |
|
22861 | 3287 |
bind(done); |
3288 |
} |
|
3289 |
||
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3290 |
/////////////////////////////////////////// String intrinsics //////////////////////////////////////////// |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
3291 |
|
36303
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3292 |
#ifdef COMPILER2 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3293 |
// Intrinsics for CompactStrings |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3294 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3295 |
// Compress char[] to byte[] by compressing 16 bytes at once. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3296 |
void MacroAssembler::string_compress_16(Register src, Register dst, Register cnt, |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3297 |
Register tmp1, Register tmp2, Register tmp3, Register tmp4, Register tmp5, |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3298 |
Label& Lfailure) { |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3299 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3300 |
const Register tmp0 = R0; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3301 |
assert_different_registers(src, dst, cnt, tmp0, tmp1, tmp2, tmp3, tmp4, tmp5); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3302 |
Label Lloop, Lslow; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3303 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3304 |
// Check if cnt >= 8 (= 16 bytes) |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3305 |
lis(tmp1, 0xFF); // tmp1 = 0x00FF00FF00FF00FF |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3306 |
srwi_(tmp2, cnt, 3); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3307 |
beq(CCR0, Lslow); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3308 |
ori(tmp1, tmp1, 0xFF); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3309 |
rldimi(tmp1, tmp1, 32, 0); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3310 |
mtctr(tmp2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3311 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3312 |
// 2x unrolled loop |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3313 |
bind(Lloop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3314 |
ld(tmp2, 0, src); // _0_1_2_3 (Big Endian) |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3315 |
ld(tmp4, 8, src); // _4_5_6_7 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3316 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3317 |
orr(tmp0, tmp2, tmp4); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3318 |
rldicl(tmp3, tmp2, 6*8, 64-24); // _____1_2 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3319 |
rldimi(tmp2, tmp2, 2*8, 2*8); // _0_2_3_3 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3320 |
rldicl(tmp5, tmp4, 6*8, 64-24); // _____5_6 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3321 |
rldimi(tmp4, tmp4, 2*8, 2*8); // _4_6_7_7 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3322 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3323 |
andc_(tmp0, tmp0, tmp1); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3324 |
bne(CCR0, Lfailure); // Not latin1. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3325 |
addi(src, src, 16); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3326 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3327 |
rlwimi(tmp3, tmp2, 0*8, 24, 31);// _____1_3 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3328 |
srdi(tmp2, tmp2, 3*8); // ____0_2_ |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3329 |
rlwimi(tmp5, tmp4, 0*8, 24, 31);// _____5_7 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3330 |
srdi(tmp4, tmp4, 3*8); // ____4_6_ |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3331 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3332 |
orr(tmp2, tmp2, tmp3); // ____0123 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3333 |
orr(tmp4, tmp4, tmp5); // ____4567 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3334 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3335 |
stw(tmp2, 0, dst); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3336 |
stw(tmp4, 4, dst); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3337 |
addi(dst, dst, 8); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3338 |
bdnz(Lloop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3339 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3340 |
bind(Lslow); // Fallback to slow version |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3341 |
} |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3342 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3343 |
// Compress char[] to byte[]. cnt must be positive int. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3344 |
void MacroAssembler::string_compress(Register src, Register dst, Register cnt, Register tmp, Label& Lfailure) { |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3345 |
Label Lloop; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3346 |
mtctr(cnt); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3347 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3348 |
bind(Lloop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3349 |
lhz(tmp, 0, src); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3350 |
cmplwi(CCR0, tmp, 0xff); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3351 |
bgt(CCR0, Lfailure); // Not latin1. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3352 |
addi(src, src, 2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3353 |
stb(tmp, 0, dst); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3354 |
addi(dst, dst, 1); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3355 |
bdnz(Lloop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3356 |
} |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3357 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3358 |
// Inflate byte[] to char[] by inflating 16 bytes at once. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3359 |
void MacroAssembler::string_inflate_16(Register src, Register dst, Register cnt, |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3360 |
Register tmp1, Register tmp2, Register tmp3, Register tmp4, Register tmp5) { |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3361 |
const Register tmp0 = R0; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3362 |
assert_different_registers(src, dst, cnt, tmp0, tmp1, tmp2, tmp3, tmp4, tmp5); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3363 |
Label Lloop, Lslow; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3364 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3365 |
// Check if cnt >= 8 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3366 |
srwi_(tmp2, cnt, 3); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3367 |
beq(CCR0, Lslow); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3368 |
lis(tmp1, 0xFF); // tmp1 = 0x00FF00FF |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3369 |
ori(tmp1, tmp1, 0xFF); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3370 |
mtctr(tmp2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3371 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3372 |
// 2x unrolled loop |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3373 |
bind(Lloop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3374 |
lwz(tmp2, 0, src); // ____0123 (Big Endian) |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3375 |
lwz(tmp4, 4, src); // ____4567 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3376 |
addi(src, src, 8); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3377 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3378 |
rldicl(tmp3, tmp2, 7*8, 64-8); // _______2 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3379 |
rlwimi(tmp2, tmp2, 3*8, 16, 23);// ____0113 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3380 |
rldicl(tmp5, tmp4, 7*8, 64-8); // _______6 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3381 |
rlwimi(tmp4, tmp4, 3*8, 16, 23);// ____4557 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3382 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3383 |
andc(tmp0, tmp2, tmp1); // ____0_1_ |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3384 |
rlwimi(tmp2, tmp3, 2*8, 0, 23); // _____2_3 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3385 |
andc(tmp3, tmp4, tmp1); // ____4_5_ |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3386 |
rlwimi(tmp4, tmp5, 2*8, 0, 23); // _____6_7 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3387 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3388 |
rldimi(tmp2, tmp0, 3*8, 0*8); // _0_1_2_3 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3389 |
rldimi(tmp4, tmp3, 3*8, 0*8); // _4_5_6_7 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3390 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3391 |
std(tmp2, 0, dst); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3392 |
std(tmp4, 8, dst); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3393 |
addi(dst, dst, 16); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3394 |
bdnz(Lloop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3395 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3396 |
bind(Lslow); // Fallback to slow version |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3397 |
} |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3398 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3399 |
// Inflate byte[] to char[]. cnt must be positive int. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3400 |
void MacroAssembler::string_inflate(Register src, Register dst, Register cnt, Register tmp) { |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3401 |
Label Lloop; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3402 |
mtctr(cnt); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3403 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3404 |
bind(Lloop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3405 |
lbz(tmp, 0, src); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3406 |
addi(src, src, 1); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3407 |
sth(tmp, 0, dst); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3408 |
addi(dst, dst, 2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3409 |
bdnz(Lloop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3410 |
} |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3411 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3412 |
// Emits code which compares two strings and leaves a compareTo-style value in
// 'result': the difference of the first pair of mismatching chars, or, if the
// strings agree up to the shorter length, the difference of the (scaled)
// lengths cnt1 - cnt2. For the UL encoding the value is negated at the end.
//
//   str1, str2 - addresses of the first chars; advanced while comparing.
//   cnt1, cnt2 - lengths. cnt1 is halved for UU, cnt2 is halved for everything
//                but LL; otherwise the value is zero extended from 32 bit.
//                NOTE(review): the halving suggests that the incoming counts
//                of UTF16 operands are byte counts -- confirm at the caller.
//   tmp1       - scratch register; holds the length difference.
//   result     - receives the outcome; also used as scratch while comparing.
//   ae         - argument encoding, one of StrIntrinsicNode::{LL, LU, UL, UU}.
//
// Clobbers str1, str2, cnt1, cnt2, tmp1, R0, CTR and CCR0.
void MacroAssembler::string_compare(Register str1, Register str2,
                                    Register cnt1, Register cnt2,
                                    Register tmp1, Register result, int ae) {
  const Register tmp0     = R0;
  const Register len_diff = tmp1;

  assert_different_registers(str1, str2, cnt1, cnt2, tmp0, tmp1, result);
  Label Lexit, Lcharwise, Lchar_loop, Luse_len_diff;

  const bool is_LL = (ae == StrIntrinsicNode::LL);
  const bool is_UU = (ae == StrIntrinsicNode::UU);

  // Since compareTo(a, b) == -compareTo(b, a), str1 and str2 are interchanged
  // in the UL case and the result gets negated at the end. That way str1 is
  // latin1 encoded in all cases but UU.
  // The counts additionally need to be 0 extended (sign extension would do as
  // well because the sign is 0).

  if (is_UU) {
    srwi(cnt1, cnt1, 1);
  } else {
    clrldi(cnt1, cnt1, 32);
  }

  if (is_LL) {
    clrldi(cnt2, cnt2, 32);
  } else {
    srwi(cnt2, cnt2, 1);
  }

  // Compute the length difference (kept as tie-breaker) and reduce cnt1 to
  // the minimum of both lengths.
  subf_(len_diff, cnt2, cnt1);    // len_diff = cnt1 - cnt2, sets CCR0.
  // if (len_diff > 0) { cnt1 = cnt2; }
  if (!VM_Version::has_isel()) {
    Label Lkeep_cnt1;
    blt(CCR0, Lkeep_cnt1);
    mr(cnt1, cnt2);
    bind(Lkeep_cnt1);
  } else {
    isel(cnt1, CCR0, Assembler::greater, /*invert*/ false, cnt2);
  }

  // From here on 'result' and R0 carry the loaded chars.
  Register chr1 = result;
  Register chr2 = tmp0;

  // Fast loop comparing 8 bytes per iteration. Only available if both
  // strings have the same encoding.
  int stride1 = 8, stride2 = 8;
  if (is_LL || is_UU) {
    const int log2_chars_per_iter = is_LL ? 3 : 2;
    Label Lword_loop, Lno_words;

    srwi_(tmp0, cnt1, log2_chars_per_iter);
    beq(CCR0, Lno_words);
    rldicl(cnt2, cnt1, 0, 64 - log2_chars_per_iter); // Chars left over after the fast loop.
    li(cnt1, 1 << log2_chars_per_iter); // On a mismatch the chars of the current iteration get rescanned.
    mtctr(tmp0);

    bind(Lword_loop);
    ld(chr1, 0, str1);
    ld(chr2, 0, str2);
    cmpd(CCR0, chr1, chr2);
    bne(CCR0, Lcharwise);
    addi(str1, str1, stride1);
    addi(str2, str2, stride2);
    bdnz(Lword_loop);
    mr(cnt1, cnt2);               // Chars left over after the fast loop.
    bind(Lno_words);
  }

  // Char by char loop which locates the first difference.
  cmpwi(CCR0, cnt1, 0);
  beq(CCR0, Luse_len_diff);
  bind(Lcharwise);
  mtctr(cnt1);

  // Element sizes of both operands. UL is treated like LU (see note above).
  if (is_LL) {
    stride1 = 1; stride2 = 1;
  } else if (ae == StrIntrinsicNode::UL || ae == StrIntrinsicNode::LU) {
    stride1 = 1; stride2 = 2;
  } else if (is_UU) {
    stride1 = 2; stride2 = 2;
  } else {
    ShouldNotReachHere();
  }

  bind(Lchar_loop);
  if (stride1 == 1) {
    lbz(chr1, 0, str1);
  } else {
    lhz(chr1, 0, str1);
  }
  if (stride2 == 1) {
    lbz(chr2, 0, str2);
  } else {
    lhz(chr2, 0, str2);
  }
  subf_(result, chr2, chr1);      // result = chr1 - chr2
  bne(CCR0, Lexit);
  addi(str1, str1, stride1);
  addi(str2, str2, stride2);
  bdnz(Lchar_loop);

  // No difference within the minimum length: the length difference decides.
  bind(Luse_len_diff);
  mr(result, len_diff);

  // Otherwise 'result' already holds the difference of the mismatching chars.
  bind(Lexit);
  if (ae == StrIntrinsicNode::UL) {
    neg(result, result);          // Operands were interchanged (see note above).
  }
}
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3512 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3513 |
void MacroAssembler::array_equals(bool is_array_equ, Register ary1, Register ary2, |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3514 |
Register limit, Register tmp1, Register result, bool is_byte) { |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3515 |
const Register tmp0 = R0; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3516 |
assert_different_registers(ary1, ary2, limit, tmp0, tmp1, result); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3517 |
Label Ldone, Lskiploop, Lloop, Lfastloop, Lskipfast; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3518 |
bool limit_needs_shift = false; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3519 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3520 |
if (is_array_equ) { |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3521 |
const int length_offset = arrayOopDesc::length_offset_in_bytes(); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3522 |
const int base_offset = arrayOopDesc::base_offset_in_bytes(is_byte ? T_BYTE : T_CHAR); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3523 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3524 |
// Return true if the same array. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3525 |
cmpd(CCR0, ary1, ary2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3526 |
beq(CCR0, Lskiploop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3527 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3528 |
// Return false if one of them is NULL. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3529 |
cmpdi(CCR0, ary1, 0); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3530 |
cmpdi(CCR1, ary2, 0); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3531 |
li(result, 0); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3532 |
cror(CCR0, Assembler::equal, CCR1, Assembler::equal); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3533 |
beq(CCR0, Ldone); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3534 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3535 |
// Load the lengths of arrays. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3536 |
lwz(limit, length_offset, ary1); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3537 |
lwz(tmp0, length_offset, ary2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3538 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3539 |
// Return false if the two arrays are not equal length. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3540 |
cmpw(CCR0, limit, tmp0); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3541 |
bne(CCR0, Ldone); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3542 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3543 |
// Load array addresses. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3544 |
addi(ary1, ary1, base_offset); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3545 |
addi(ary2, ary2, base_offset); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3546 |
} else { |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3547 |
limit_needs_shift = !is_byte; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3548 |
li(result, 0); // Assume not equal. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3549 |
} |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3550 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3551 |
// Rename registers |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3552 |
Register chr1 = tmp0; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3553 |
Register chr2 = tmp1; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3554 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3555 |
// Compare 8 bytes per iteration in fast loop. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3556 |
const int log2_chars_per_iter = is_byte ? 3 : 2; |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3557 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3558 |
srwi_(tmp0, limit, log2_chars_per_iter + (limit_needs_shift ? 1 : 0)); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3559 |
beq(CCR0, Lskipfast); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3560 |
mtctr(tmp0); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3561 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3562 |
bind(Lfastloop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3563 |
ld(chr1, 0, ary1); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3564 |
ld(chr2, 0, ary2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3565 |
addi(ary1, ary1, 8); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3566 |
addi(ary2, ary2, 8); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3567 |
cmpd(CCR0, chr1, chr2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3568 |
bne(CCR0, Ldone); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3569 |
bdnz(Lfastloop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3570 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3571 |
bind(Lskipfast); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3572 |
rldicl_(limit, limit, limit_needs_shift ? 64 - 1 : 0, 64 - log2_chars_per_iter); // Remaining characters. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3573 |
beq(CCR0, Lskiploop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3574 |
mtctr(limit); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3575 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3576 |
// Character by character. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3577 |
bind(Lloop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3578 |
if (is_byte) { |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3579 |
lbz(chr1, 0, ary1); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3580 |
lbz(chr2, 0, ary2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3581 |
addi(ary1, ary1, 1); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3582 |
addi(ary2, ary2, 1); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3583 |
} else { |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3584 |
lhz(chr1, 0, ary1); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3585 |
lhz(chr2, 0, ary2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3586 |
addi(ary1, ary1, 2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3587 |
addi(ary2, ary2, 2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3588 |
} |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3589 |
cmpw(CCR0, chr1, chr2); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3590 |
bne(CCR0, Ldone); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3591 |
bdnz(Lloop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3592 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3593 |
bind(Lskiploop); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3594 |
li(result, 1); // All characters are equal. |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3595 |
bind(Ldone); |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3596 |
} |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3597 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3598 |
// Emit code that searches 'haystack' (haycnt characters) for 'needle' and leaves the
// character index of the match in 'result', or -1 if the needle does not occur.
//
//   needlecntval != 0 - the needle length is this compile-time constant (1 is rejected,
//                       single-character needles must be handled by the caller).
//   needlecntval == 0 - the needle length is read from register 'needlecnt' at run time;
//                       lengths below 2 are served by a separate one-character loop.
//   ae                - StrIntrinsicNode encoding, LU is not accepted. Haystack characters
//                       are 1 byte wide for LL and 2 bytes otherwise; needle characters are
//                       2 bytes wide for UU and 1 byte otherwise.
//   needle_values     - not used by this implementation.
//
// Prerequisite, to be ensured in the ideal graph: 0 < needlecnt <= haycnt.
// Clobbers haycnt, tmp1..tmp4, R0, CCR0, CCR1 and CTR; additionally needlecnt and CCR6
// for a variable needle length, and needlecnt for constant lengths above 3.
void MacroAssembler::string_indexof(Register result, Register haystack, Register haycnt,
                                    Register needle, ciTypeArray* needle_values, Register needlecnt, int needlecntval,
                                    Register tmp1, Register tmp2, Register tmp3, Register tmp4, int ae) {

  assert(ae != StrIntrinsicNode::LU, "Invalid encoding");

  const bool variable_needle = (needlecntval == 0);
  const bool is_UL           = (ae == StrIntrinsicNode::UL);
  const int  h_csize         = (ae == StrIntrinsicNode::LL) ? 1 : 2;
  const int  n_csize         = (ae == StrIntrinsicNode::UU) ? 2 : 1;

  const Register last_addr = haycnt; // haycnt is overwritten once last_addr gets computed.
  const Register cursor    = tmp1;   // Current haystack address.
  const Register n_head    = tmp2;   // First two needle characters (or the only one).
  const Register val1      = tmp3;
  const Register val2      = R0;

  Label L_short_needle, L_match, L_no_match, L_exit;

  // **************************************************************************************************
  // Set-up for the main loop, which expects at least 2 needle characters.
  // **************************************************************************************************

  clrldi(haycnt, haycnt, 32);         // Zero-extend the int so it can be used as 64 bit value.
  addi(cursor, haystack, -h_csize);   // Start one character early, the loops pre-increment.
  if (variable_needle) {
    cmpwi(CCR6, needlecnt, 2);        // CCR6 is consulted again after the first 2 characters matched.
    clrldi(needlecnt, needlecnt, 32); // Zero-extend the int so it can be used as 64 bit value.
    blt(CCR6, L_short_needle);        // Fewer than 2 needle characters: separate path.
  }

  // Fetch the first 2 needle characters with a single load.
  if (n_csize == 1) { lhz(n_head, 0, needle); } else { lwz(n_head, 0, needle); }

  // val1 = haycnt - needlecnt, the last haystack index at which a match may start.
  // needlecnt is turned into the number of needle characters behind the first two.
  if (!variable_needle) {
    guarantee(needlecntval != 1, "IndexOf with single-character needle must be handled separately");
    assert((needlecntval & 0x7fff) == needlecntval, "wrong immediate");
    addi(val1, haycnt, -needlecntval);
    if (needlecntval > 3) { li(needlecnt, needlecntval - 2); }
  } else {
    subf(val1, needlecnt, haycnt);
    addi(needlecnt, needlecnt, -2);
  }

  if (h_csize == 2) { slwi(val1, val1, 1); } // Index -> byte offset.

  if (is_UL) {
    // The needle has 1-byte characters but the haystack 2-byte ones: spread the two
    // needle bytes so that they line up with a 4-byte haystack load.
    srwi(tmp4, n_head, 1*8);           // ___0
    rlwimi(n_head, tmp4, 2*8, 0, 23);  // _0_1
  }

  add(last_addr, haystack, val1);     // Address of the last possible match start.

  // **************************************************************************************************
  // Main loop: look for the first 2 needle characters.
  // **************************************************************************************************
  Label L_outer, L_inner, L_last_pos, L_hit_first, L_hit_second;
  const Register remaining = tmp4;

  bind(L_outer);
  subf(remaining, cursor, last_addr); // Bytes between the position checked last and the last one to check.
  addi(cursor, cursor, h_csize);      // Next position to compare at.
  srdi_(val2, remaining, h_csize);    // Number of inner loop iterations (2 positions each).
  beq(CCR0, L_last_pos);              // None: at most one position is left.
  mtctr(val2);

  bind(L_inner);                      // 2x unrolled: tests two adjacent start positions.
  if (h_csize == 1) {                 // Load 2 haystack characters per position (alignment is ignored).
    lhz(val1, 0, cursor);
    lhz(val2, 1, cursor);
  } else {
    lwz(val1, 0, cursor);
    lwz(val2, 2, cursor);
  }
  cmpw(CCR0, val1, n_head);           // Comparing 2 characters at once saves branches into the rest-compare.
  cmpw(CCR1, val2, n_head);
  beq(CCR0, L_hit_first);             // Needle start at cursor?
  beq(CCR1, L_hit_second);            // Needle start one character behind cursor?
  addi(cursor, cursor, 2 * h_csize);
  bdnz(L_inner);

  bind(L_last_pos);
  andi_(remaining, remaining, h_csize); // Odd number of positions: one was not covered by the inner loop.
  beq(CCR0, L_no_match);
  if (h_csize == 1) { lhz(val1, 0, cursor); } else { lwz(val1, 0, cursor); }
  cmpw(CCR1, val1, n_head);
  beq(CCR1, L_hit_first);

  bind(L_no_match);
  li(result, -1);                     // not found
  b(L_exit);

  // **************************************************************************************************
  // Special case: a variable needle length may turn out to be below 2.
  // **************************************************************************************************
  if (variable_needle) {
    Label L_single_loop;
    bind(L_short_needle);
    mtctr(haycnt);
    if (n_csize == 1) { lbz(n_head, 0, needle); } else { lhz(n_head, 0, needle); } // The one needle character.
    bind(L_single_loop);
    if (h_csize == 1) { lbzu(val1, 1, cursor); } else { lhzu(val1, 2, cursor); }   // Load with cursor update.
    cmpw(CCR1, val1, n_head);
    beq(CCR1, L_match);               // Found the single character.
    bdnz(L_single_loop);
    li(result, -1);                   // Not found.
    b(L_exit);
  }

  // **************************************************************************************************
  // Main loop, second part: the first 2 characters matched, now compare the rest of the needle.
  // **************************************************************************************************
  bind(L_hit_second);
  addi(cursor, cursor, h_csize);      // The match candidate starts one character further.
  bind(L_hit_first);                  // cursor points to the candidate.
  if (needlecntval == 3) {
    // Exactly one needle character is left, no loop needed.
    if (n_csize == 1) { lbz(val2, 2 * 1, needle); } else { lhz(val2, 2 * 2, needle); }
    if (h_csize == 1) { lbz(val1, 2 * 1, cursor); } else { lhz(val1, 2 * 2, cursor); }
    cmpw(CCR1, val1, val2);
    bne(CCR1, L_outer);
  } else if (needlecntval != 2) {     // A constant length of 2 is already fully compared.
    if (variable_needle) { beq(CCR6, L_match); } // Variable length was exactly 2 (compare from set-up).
    const Register n_ind = tmp4;
    // With UL the haystack offset is twice the needle offset and needs its own register.
    const Register h_ind = is_UL ? val1 : n_ind;
    li(n_ind, 2 * n_csize);           // Byte offset of needle character 2.
    mtctr(needlecnt);                 // Needle length minus 2, still > 0.
    Label L_rest_loop;
    bind(L_rest_loop);
    if (is_UL) {
      sldi(h_ind, n_ind, 1);
    }
    if (n_csize == 1) { lbzx(val2, needle, n_ind); } else { lhzx(val2, needle, n_ind); }
    if (h_csize == 1) { lbzx(val1, cursor, h_ind); } else { lhzx(val1, cursor, h_ind); }
    cmpw(CCR1, val1, val2);
    bne(CCR1, L_outer);               // Mismatch: resume the search behind the candidate.
    addi(n_ind, n_ind, n_csize);
    bdnz(L_rest_loop);
  }

  // Convert the match address into a character index relative to the haystack.
  bind(L_match);
  subf(result, haystack, cursor);
  if (h_csize == 2) { srdi(result, result, 1); }
  bind(L_exit);
} // string_indexof
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3738 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3739 |
// Emits code that searches a haystack for a single character.
//
//   result     - receives the index (in characters, relative to haystack) of the
//                first matching position, or -1 if there is no match.
//   haystack   - address of the first haystack element.
//   haycnt     - number of haystack elements to inspect.
//   needle     - register holding the character to look for. If R0 is passed,
//                needleChar is compared as an immediate instead.
//   needleChar - constant character; only used when needle == R0.
//   tmp1       - scratch: running address into the haystack.
//   tmp2       - scratch: loop count, then the loaded haystack element.
//   is_byte    - true: haystack elements are 1 byte wide; false: 2 bytes wide.
//
// The emitted code writes R0, CTR, CCR0 and CCR1.
void MacroAssembler::string_indexof_char(Register result, Register haystack, Register haycnt,
                                         Register needle, jchar needleChar, Register tmp1, Register tmp2, bool is_byte) {
  assert_different_registers(haystack, haycnt, needle, tmp1, tmp2);

  Label L_InnerLoop, L_FinalCheck, L_Found1, L_Found2, L_NotFound, L_End;
  Register addr = tmp1,
           ch1 = tmp2,
           ch2 = R0;

  const int h_csize = is_byte ? 1 : 2;

//4:
  srwi_(tmp2, haycnt, 1);   // Shift right by exact_log2(UNROLL_FACTOR).
  mr(addr, haystack);
  beq(CCR0, L_FinalCheck);  // Fewer than two elements: skip the unrolled loop.
  mtctr(tmp2);              // Move to count register.
//8:
  bind(L_InnerLoop);        // Main work horse (2x unrolled search loop).
  if (!is_byte) {
    lhz(ch1, 0, addr);
    lhz(ch2, 2, addr);
  } else {
    lbz(ch1, 0, addr);
    lbz(ch2, 1, addr);
  }
  // Compare against the needle register, or against the immediate when needle == R0.
  (needle != R0) ? cmpw(CCR0, ch1, needle) : cmplwi(CCR0, ch1, (unsigned int)needleChar);
  (needle != R0) ? cmpw(CCR1, ch2, needle) : cmplwi(CCR1, ch2, (unsigned int)needleChar);
  beq(CCR0, L_Found1);      // Did we find the needle?
  beq(CCR1, L_Found2);
  addi(addr, addr, 2 * h_csize);
  bdnz(L_InnerLoop);
//16:
  bind(L_FinalCheck);
  andi_(R0, haycnt, 1);     // Odd element count: one trailing element remains.
  beq(CCR0, L_NotFound);
  if (!is_byte) { lhz(ch1, 0, addr); } else { lbz(ch1, 0, addr); } // One position left at which we have to compare.
  (needle != R0) ? cmpw(CCR1, ch1, needle) : cmplwi(CCR1, ch1, (unsigned int)needleChar);
  beq(CCR1, L_Found1);
//21:
  bind(L_NotFound);
  li(result, -1);           // Not found.
  b(L_End);

  bind(L_Found2);           // Match at the second element of the pair: step addr onto it.
  addi(addr, addr, h_csize);
//24:
  bind(L_Found1);           // Return index ...
  subf(result, haystack, addr); // relative to haystack, ...
  if (!is_byte) { srdi(result, result, 1); } // in characters.
  bind(L_End);
} // string_indexof_char
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3790 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3791 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3792 |
// Emits code that checks whether any of the cnt bytes starting at src has its
// most significant bit (0x80) set.
//
//   src    - address of the first byte; it is advanced while scanning.
//   cnt    - number of bytes to inspect.
//   result - set to 1 if such a byte was found, 0 otherwise.
//   tmp1   - scratch: holds the mask 0x8080808080808080 for the fast loop.
//   tmp2   - scratch: fast-loop iteration count, then loaded data.
//
// R0 is used as an additional temporary. The emitted code writes CTR and CCR0.
void MacroAssembler::has_negatives(Register src, Register cnt, Register result,
                                   Register tmp1, Register tmp2) {
  const Register tmp0 = R0;
  assert_different_registers(src, result, cnt, tmp0, tmp1, tmp2);
  Label Lfastloop, Lslow, Lloop, Lnoneg, Ldone;

  // Check if cnt >= 16 bytes, i.e. at least one iteration of the 16-byte fast loop.
  lis(tmp1, (int)(short)0x8080);  // Start building the mask; completed below to 0x8080808080808080.
  srwi_(tmp2, cnt, 4);            // Number of 16-byte chunks.
  li(result, 1);                  // Assume there's a negative byte.
  beq(CCR0, Lslow);               // No full chunk: only the byte-wise loop is needed.
  ori(tmp1, tmp1, 0x8080);
  rldimi(tmp1, tmp1, 32, 0);      // tmp1 = 0x8080808080808080
  mtctr(tmp2);

  // 2x unrolled loop
  bind(Lfastloop);
  ld(tmp2, 0, src);
  ld(tmp0, 8, src);

  orr(tmp0, tmp2, tmp0);          // Combine both doublewords so one test covers 16 bytes.

  and_(tmp0, tmp0, tmp1);
  bne(CCR0, Ldone);               // Found negative byte.
  addi(src, src, 16);

  bdnz(Lfastloop);

  bind(Lslow);                    // Fallback to slow version
  rldicl_(tmp0, cnt, 0, 64-4);    // Remaining bytes: cnt & 15.
  beq(CCR0, Lnoneg);
  mtctr(tmp0);
  bind(Lloop);
  lbz(tmp0, 0, src);
  addi(src, src, 1);
  andi_(tmp0, tmp0, 0x80);
  bne(CCR0, Ldone);               // Found negative byte.
  bdnz(Lloop);
  bind(Lnoneg);
  li(result, 0);

  bind(Ldone);
}
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3835 |
|
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3836 |
#endif // Compiler2 |
6241574f5982
8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents:
35913
diff
changeset
|
3837 |
|
31861 | 3838 |
// Helpers for Intrinsic Emitters |
3839 |
// |
|
3840 |
// Revert the byte order of a 32bit value in a register |
|
3841 |
// src: 0x44556677 |
|
3842 |
// dst: 0x77665544 |
|
3843 |
// Three steps to obtain the result: |
|
3844 |
// 1) Rotate src (as doubleword) left 5 bytes. That puts the leftmost byte of the src word |
|
3845 |
// into the rightmost byte position. Afterwards, everything left of the rightmost byte is cleared. |
|
3846 |
// This value initializes dst. |
|
3847 |
// 2) Rotate src (as word) left 3 bytes. That puts the rightmost byte of the src word into the leftmost |
|
3848 |
// byte position. Furthermore, byte 5 is rotated into byte 6 position where it is supposed to go. |
|
3849 |
// This value is mask inserted into dst with a [0..23] mask of 1s. |
|
3850 |
// 3) Rotate src (as word) left 1 byte. That puts byte 6 into byte 5 position. |
|
3851 |
// This value is mask inserted into dst with a [8..15] mask of 1s. |
|
3852 |
void MacroAssembler::load_reverse_32(Register dst, Register src) { |
|
3853 |
assert_different_registers(dst, src); |
|
3854 |
||
3855 |
rldicl(dst, src, (4+1)*8, 56); // Rotate byte 4 into position 7 (rightmost), clear all to the left. |
|
3856 |
rlwimi(dst, src, 3*8, 0, 23); // Insert byte 5 into position 6, 7 into 4, leave pos 7 alone. |
|
3857 |
rlwimi(dst, src, 1*8, 8, 15); // Insert byte 6 into position 5, leave the rest alone. |
|
3858 |
} |
|
3859 |
||
3860 |
// Calculate the column addresses of the crc32 lookup table into distinct registers. |
|
3861 |
// This loop-invariant calculation is moved out of the loop body, reducing the loop |
|
3862 |
// body size from 20 to 16 instructions. |
|
3863 |
// Returns the offset that was used to calculate the address of column tc3. |
|
3864 |
// Due to register shortage, setting tc3 may overwrite table. With the return offset |
|
3865 |
// at hand, the original table address can be easily reconstructed. |
|
3866 |
int MacroAssembler::crc32_table_columns(Register table, Register tc0, Register tc1, Register tc2, Register tc3) { |
|
3867 |
||
3868 |
#ifdef VM_LITTLE_ENDIAN |
|
3869 |
// This is what we implement (the DOLIT4 part): |
|
3870 |
// ========================================================================= */ |
|
3871 |
// #define DOLIT4 c ^= *buf4++; \ |
|
3872 |
// c = crc_table[3][c & 0xff] ^ crc_table[2][(c >> 8) & 0xff] ^ \ |
|
3873 |
// crc_table[1][(c >> 16) & 0xff] ^ crc_table[0][c >> 24] |
|
3874 |
// #define DOLIT32 DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4 |
|
3875 |
// ========================================================================= */ |
|
3876 |
const int ix0 = 3*(4*CRC32_COLUMN_SIZE); |
|
3877 |
const int ix1 = 2*(4*CRC32_COLUMN_SIZE); |
|
3878 |
const int ix2 = 1*(4*CRC32_COLUMN_SIZE); |
|
3879 |
const int ix3 = 0*(4*CRC32_COLUMN_SIZE); |
|
3880 |
#else |
|
3881 |
// This is what we implement (the DOBIG4 part): |
|
3882 |
// ========================================================================= |
|
3883 |
// #define DOBIG4 c ^= *++buf4; \ |
|
3884 |
// c = crc_table[4][c & 0xff] ^ crc_table[5][(c >> 8) & 0xff] ^ \ |
|
3885 |
// crc_table[6][(c >> 16) & 0xff] ^ crc_table[7][c >> 24] |
|
3886 |
// #define DOBIG32 DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4 |
|
3887 |
// ========================================================================= |
|
3888 |
const int ix0 = 4*(4*CRC32_COLUMN_SIZE); |
|
3889 |
const int ix1 = 5*(4*CRC32_COLUMN_SIZE); |
|
3890 |
const int ix2 = 6*(4*CRC32_COLUMN_SIZE); |
|
3891 |
const int ix3 = 7*(4*CRC32_COLUMN_SIZE); |
|
3892 |
#endif |
|
3893 |
assert_different_registers(table, tc0, tc1, tc2); |
|
3894 |
assert(table == tc3, "must be!"); |
|
3895 |
||
35541
cba047a086d5
8146613: PPC64: C2 does no longer respect int to long conversion for stub calls
mdoerr
parents:
35085
diff
changeset
|
3896 |
addi(tc0, table, ix0); |
cba047a086d5
8146613: PPC64: C2 does no longer respect int to long conversion for stub calls
mdoerr
parents:
35085
diff
changeset
|
3897 |
addi(tc1, table, ix1); |
cba047a086d5
8146613: PPC64: C2 does no longer respect int to long conversion for stub calls
mdoerr
parents:
35085
diff
changeset
|
3898 |
addi(tc2, table, ix2); |
31861 | 3899 |
if (ix3 != 0) addi(tc3, table, ix3); |
3900 |
||
3901 |
return ix3; |
|
3902 |
} |
|
3903 |
||
3904 |
/** |
|
3905 |
* uint32_t crc; |
|
3906 |
* timesXtoThe32[crc & 0xFF] ^ (crc >> 8); |
|
3907 |
*/ |
|
3908 |
void MacroAssembler::fold_byte_crc32(Register crc, Register val, Register table, Register tmp) { |
|
3909 |
assert_different_registers(crc, table, tmp); |
|
3910 |
assert_different_registers(val, table); |
|
3911 |
||
3912 |
if (crc == val) { // Must rotate first to use the unmodified value. |
|
3913 |
rlwinm(tmp, val, 2, 24-2, 31-2); // Insert (rightmost) byte 7 of val, shifted left by 2, into byte 6..7 of tmp, clear the rest. |
|
3914 |
// As we use a word (4-byte) instruction, we have to adapt the mask bit positions. |
|
3915 |
srwi(crc, crc, 8); // Unsigned shift, clear leftmost 8 bits. |
|
3916 |
} else { |
|
3917 |
srwi(crc, crc, 8); // Unsigned shift, clear leftmost 8 bits. |
|
3918 |
rlwinm(tmp, val, 2, 24-2, 31-2); // Insert (rightmost) byte 7 of val, shifted left by 2, into byte 6..7 of tmp, clear the rest. |
|
3919 |
} |
|
3920 |
lwzx(tmp, table, tmp); |
|
3921 |
xorr(crc, crc, tmp); |
|
3922 |
} |
|
3923 |
||
3924 |
/** |
|
3925 |
* uint32_t crc; |
|
3926 |
* timesXtoThe32[crc & 0xFF] ^ (crc >> 8); |
|
3927 |
*/ |
|
3928 |
void MacroAssembler::fold_8bit_crc32(Register crc, Register table, Register tmp) { |
|
3929 |
fold_byte_crc32(crc, crc, table, tmp); |
|
3930 |
} |
|
3931 |
||
3932 |
/** |
|
3933 |
* Emits code to update CRC-32 with a byte value according to constants in table. |
|
3934 |
* |
|
3935 |
* @param [in,out]crc Register containing the crc. |
|
3936 |
* @param [in]val Register containing the byte to fold into the CRC. |
|
3937 |
* @param [in]table Register containing the table of crc constants. |
|
3938 |
* |
|
3939 |
* uint32_t crc; |
|
3940 |
* val = crc_table[(val ^ crc) & 0xFF]; |
|
3941 |
* crc = val ^ (crc >> 8); |
|
3942 |
*/ |
|
3943 |
void MacroAssembler::update_byte_crc32(Register crc, Register val, Register table) { |
|
3944 |
BLOCK_COMMENT("update_byte_crc32:"); |
|
3945 |
xorr(val, val, crc); |
|
3946 |
fold_byte_crc32(crc, val, table, val); |
|
3947 |
} |
|
3948 |
||
3949 |
/** |
|
3950 |
* @param crc register containing existing CRC (32-bit) |
|
3951 |
* @param buf register pointing to input byte buffer (byte*) |
|
3952 |
* @param len register containing number of bytes |
|
3953 |
* @param table register pointing to CRC table |
|
3954 |
*/ |
|
3955 |
void MacroAssembler::update_byteLoop_crc32(Register crc, Register buf, Register len, Register table, |
|
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
3956 |
Register data, bool loopAlignment) { |
31861 | 3957 |
assert_different_registers(crc, buf, len, table, data); |
3958 |
||
3959 |
Label L_mainLoop, L_done; |
|
3960 |
const int mainLoop_stepping = 1; |
|
3961 |
const int mainLoop_alignment = loopAlignment ? 32 : 4; // (InputForNewCode > 4 ? InputForNewCode : 32) : 4; |
|
3962 |
||
3963 |
// Process all bytes in a single-byte loop. |
|
35541
cba047a086d5
8146613: PPC64: C2 does no longer respect int to long conversion for stub calls
mdoerr
parents:
35085
diff
changeset
|
3964 |
clrldi_(len, len, 32); // Enforce 32 bit. Anything to do? |
31861 | 3965 |
beq(CCR0, L_done); |
3966 |
||
35541
cba047a086d5
8146613: PPC64: C2 does no longer respect int to long conversion for stub calls
mdoerr
parents:
35085
diff
changeset
|
3967 |
mtctr(len); |
31861 | 3968 |
align(mainLoop_alignment); |
3969 |
BIND(L_mainLoop); |
|
3970 |
lbz(data, 0, buf); // Byte from buffer, zero-extended. |
|
3971 |
addi(buf, buf, mainLoop_stepping); // Advance buffer position. |
|
3972 |
update_byte_crc32(crc, data, table); |
|
3973 |
bdnz(L_mainLoop); // Iterate. |
|
3974 |
||
3975 |
bind(L_done); |
|
3976 |
} |
|
3977 |
||
3978 |
/** |
|
3979 |
* Emits code to update CRC-32 with a 4-byte value according to constants in table |
|
3980 |
* Implementation according to jdk/src/share/native/java/util/zip/zlib-1.2.8/crc32.c |
|
3981 |
*/ |
|
3982 |
// A not on the lookup table address(es): |
|
3983 |
// The lookup table consists of two sets of four columns each. |
|
3984 |
// The columns {0..3} are used for little-endian machines. |
|
3985 |
// The columns {4..7} are used for big-endian machines. |
|
3986 |
// To save the effort of adding the column offset to the table address each time |
|
3987 |
// a table element is looked up, it is possible to pass the pre-calculated |
|
3988 |
// column addresses. |
|
3989 |
// Uses R9..R12 as work register. Must be saved/restored by caller, if necessary. |
|
3990 |
void MacroAssembler::update_1word_crc32(Register crc, Register buf, Register table, int bufDisp, int bufInc, |
|
3991 |
Register t0, Register t1, Register t2, Register t3, |
|
3992 |
Register tc0, Register tc1, Register tc2, Register tc3) { |
|
3993 |
assert_different_registers(crc, t3); |
|
3994 |
||
3995 |
// XOR crc with next four bytes of buffer. |
|
3996 |
lwz(t3, bufDisp, buf); |
|
3997 |
if (bufInc != 0) { |
|
3998 |
addi(buf, buf, bufInc); |
|
3999 |
} |
|
4000 |
xorr(t3, t3, crc); |
|
4001 |
||
4002 |
// Chop crc into 4 single-byte pieces, shifted left 2 bits, to form the table indices. |
|
4003 |
rlwinm(t0, t3, 2, 24-2, 31-2); // ((t1 >> 0) & 0xff) << 2 |
|
4004 |
rlwinm(t1, t3, 32+(2- 8), 24-2, 31-2); // ((t1 >> 8) & 0xff) << 2 |
|
4005 |
rlwinm(t2, t3, 32+(2-16), 24-2, 31-2); // ((t1 >> 16) & 0xff) << 2 |
|
4006 |
rlwinm(t3, t3, 32+(2-24), 24-2, 31-2); // ((t1 >> 24) & 0xff) << 2 |
|
4007 |
||
4008 |
// Use the pre-calculated column addresses. |
|
4009 |
// Load pre-calculated table values. |
|
4010 |
lwzx(t0, tc0, t0); |
|
4011 |
lwzx(t1, tc1, t1); |
|
4012 |
lwzx(t2, tc2, t2); |
|
4013 |
lwzx(t3, tc3, t3); |
|
4014 |
||
4015 |
// Calculate new crc from table values. |
|
4016 |
xorr(t0, t0, t1); |
|
4017 |
xorr(t2, t2, t3); |
|
4018 |
xorr(crc, t0, t2); // Now crc contains the final checksum value. |
|
4019 |
} |
|
4020 |
||
4021 |
/** |
|
4022 |
* @param crc register containing existing CRC (32-bit) |
|
4023 |
* @param buf register pointing to input byte buffer (byte*) |
|
4024 |
* @param len register containing number of bytes |
|
4025 |
* @param table register pointing to CRC table |
|
4026 |
* |
|
4027 |
* Uses R9..R12 as work register. Must be saved/restored by caller! |
|
4028 |
*/ |
|
4029 |
void MacroAssembler::kernel_crc32_2word(Register crc, Register buf, Register len, Register table, |
|
4030 |
Register t0, Register t1, Register t2, Register t3, |
|
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4031 |
Register tc0, Register tc1, Register tc2, Register tc3, |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4032 |
bool invertCRC) { |
31861 | 4033 |
assert_different_registers(crc, buf, len, table); |
4034 |
||
4035 |
Label L_mainLoop, L_tail; |
|
4036 |
Register tmp = t0; |
|
4037 |
Register data = t0; |
|
4038 |
Register tmp2 = t1; |
|
4039 |
const int mainLoop_stepping = 8; |
|
4040 |
const int tailLoop_stepping = 1; |
|
4041 |
const int log_stepping = exact_log2(mainLoop_stepping); |
|
4042 |
const int mainLoop_alignment = 32; // InputForNewCode > 4 ? InputForNewCode : 32; |
|
4043 |
const int complexThreshold = 2*mainLoop_stepping; |
|
4044 |
||
4045 |
// Don't test for len <= 0 here. This pathological case should not occur anyway. |
|
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4046 |
// Optimizing for it by adding a test and a branch seems to be a waste of CPU cycles |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4047 |
// for all well-behaved cases. The situation itself is detected and handled correctly |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4048 |
// within update_byteLoop_crc32. |
31861 | 4049 |
assert(tailLoop_stepping == 1, "check tailLoop_stepping!"); |
4050 |
||
4051 |
BLOCK_COMMENT("kernel_crc32_2word {"); |
|
4052 |
||
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4053 |
if (invertCRC) { |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4054 |
nand(crc, crc, crc); // 1s complement of crc |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4055 |
} |
31861 | 4056 |
|
4057 |
// Check for short (<mainLoop_stepping) buffer. |
|
4058 |
cmpdi(CCR0, len, complexThreshold); |
|
4059 |
blt(CCR0, L_tail); |
|
4060 |
||
4061 |
// Pre-mainLoop alignment did show a slight (1%) positive effect on performance. |
|
4062 |
// We leave the code in for reference. Maybe we need alignment when we exploit vector instructions. |
|
4063 |
{ |
|
4064 |
// Align buf addr to mainLoop_stepping boundary. |
|
4065 |
neg(tmp2, buf); // Calculate # preLoop iterations for alignment. |
|
4066 |
rldicl(tmp2, tmp2, 0, 64-log_stepping); // Rotate tmp2 0 bits, insert into tmp2, anding with mask with 1s from 62..63. |
|
4067 |
||
4068 |
if (complexThreshold > mainLoop_stepping) { |
|
4069 |
sub(len, len, tmp2); // Remaining bytes for main loop (>=mainLoop_stepping is guaranteed). |
|
4070 |
} else { |
|
4071 |
sub(tmp, len, tmp2); // Remaining bytes for main loop. |
|
4072 |
cmpdi(CCR0, tmp, mainLoop_stepping); |
|
4073 |
blt(CCR0, L_tail); // For less than one mainloop_stepping left, do only tail processing |
|
4074 |
mr(len, tmp); // remaining bytes for main loop (>=mainLoop_stepping is guaranteed). |
|
4075 |
} |
|
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4076 |
update_byteLoop_crc32(crc, buf, tmp2, table, data, false); |
31861 | 4077 |
} |
4078 |
||
4079 |
srdi(tmp2, len, log_stepping); // #iterations for mainLoop |
|
4080 |
andi(len, len, mainLoop_stepping-1); // remaining bytes for tailLoop |
|
4081 |
mtctr(tmp2); |
|
4082 |
||
4083 |
#ifdef VM_LITTLE_ENDIAN |
|
4084 |
Register crc_rv = crc; |
|
4085 |
#else |
|
4086 |
Register crc_rv = tmp; // Load_reverse needs separate registers to work on. |
|
4087 |
// Occupies tmp, but frees up crc. |
|
4088 |
load_reverse_32(crc_rv, crc); // Revert byte order because we are dealing with big-endian data. |
|
4089 |
tmp = crc; |
|
4090 |
#endif |
|
4091 |
||
4092 |
int reconstructTableOffset = crc32_table_columns(table, tc0, tc1, tc2, tc3); |
|
4093 |
||
4094 |
align(mainLoop_alignment); // Octoword-aligned loop address. Shows 2% improvement. |
|
4095 |
BIND(L_mainLoop); |
|
4096 |
update_1word_crc32(crc_rv, buf, table, 0, 0, crc_rv, t1, t2, t3, tc0, tc1, tc2, tc3); |
|
4097 |
update_1word_crc32(crc_rv, buf, table, 4, mainLoop_stepping, crc_rv, t1, t2, t3, tc0, tc1, tc2, tc3); |
|
4098 |
bdnz(L_mainLoop); |
|
4099 |
||
4100 |
#ifndef VM_LITTLE_ENDIAN |
|
4101 |
load_reverse_32(crc, crc_rv); // Revert byte order because we are dealing with big-endian data. |
|
4102 |
tmp = crc_rv; // Tmp uses it's original register again. |
|
4103 |
#endif |
|
4104 |
||
4105 |
// Restore original table address for tailLoop. |
|
4106 |
if (reconstructTableOffset != 0) { |
|
4107 |
addi(table, table, -reconstructTableOffset); |
|
4108 |
} |
|
4109 |
||
4110 |
// Process last few (<complexThreshold) bytes of buffer. |
|
4111 |
BIND(L_tail); |
|
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4112 |
update_byteLoop_crc32(crc, buf, len, table, data, false); |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4113 |
|
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4114 |
if (invertCRC) { |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4115 |
nand(crc, crc, crc); // 1s complement of crc |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4116 |
} |
31861 | 4117 |
BLOCK_COMMENT("} kernel_crc32_2word"); |
4118 |
} |
|
4119 |
||
4120 |
/** |
|
4121 |
* @param crc register containing existing CRC (32-bit) |
|
4122 |
* @param buf register pointing to input byte buffer (byte*) |
|
4123 |
* @param len register containing number of bytes |
|
4124 |
* @param table register pointing to CRC table |
|
4125 |
* |
|
4126 |
* uses R9..R12 as work register. Must be saved/restored by caller! |
|
4127 |
*/ |
|
4128 |
void MacroAssembler::kernel_crc32_1word(Register crc, Register buf, Register len, Register table, |
|
4129 |
Register t0, Register t1, Register t2, Register t3, |
|
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4130 |
Register tc0, Register tc1, Register tc2, Register tc3, |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4131 |
bool invertCRC) { |
31861 | 4132 |
assert_different_registers(crc, buf, len, table); |
4133 |
||
4134 |
Label L_mainLoop, L_tail; |
|
4135 |
Register tmp = t0; |
|
4136 |
Register data = t0; |
|
4137 |
Register tmp2 = t1; |
|
4138 |
const int mainLoop_stepping = 4; |
|
4139 |
const int tailLoop_stepping = 1; |
|
4140 |
const int log_stepping = exact_log2(mainLoop_stepping); |
|
4141 |
const int mainLoop_alignment = 32; // InputForNewCode > 4 ? InputForNewCode : 32; |
|
4142 |
const int complexThreshold = 2*mainLoop_stepping; |
|
4143 |
||
4144 |
// Don't test for len <= 0 here. This pathological case should not occur anyway. |
|
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4145 |
// Optimizing for it by adding a test and a branch seems to be a waste of CPU cycles |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4146 |
// for all well-behaved cases. The situation itself is detected and handled correctly |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4147 |
// within update_byteLoop_crc32. |
31861 | 4148 |
assert(tailLoop_stepping == 1, "check tailLoop_stepping!"); |
4149 |
||
4150 |
BLOCK_COMMENT("kernel_crc32_1word {"); |
|
4151 |
||
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4152 |
if (invertCRC) { |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4153 |
nand(crc, crc, crc); // 1s complement of crc |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4154 |
} |
31861 | 4155 |
|
4156 |
// Check for short (<mainLoop_stepping) buffer. |
|
4157 |
cmpdi(CCR0, len, complexThreshold); |
|
4158 |
blt(CCR0, L_tail); |
|
4159 |
||
4160 |
// Pre-mainLoop alignment did show a slight (1%) positive effect on performance. |
|
4161 |
// We leave the code in for reference. Maybe we need alignment when we exploit vector instructions. |
|
4162 |
{ |
|
4163 |
// Align buf addr to mainLoop_stepping boundary. |
|
4164 |
neg(tmp2, buf); // Calculate # preLoop iterations for alignment. |
|
4165 |
rldicl(tmp2, tmp2, 0, 64-log_stepping); // Rotate tmp2 0 bits, insert into tmp2, anding with mask with 1s from 62..63. |
|
4166 |
||
4167 |
if (complexThreshold > mainLoop_stepping) { |
|
4168 |
sub(len, len, tmp2); // Remaining bytes for main loop (>=mainLoop_stepping is guaranteed). |
|
4169 |
} else { |
|
4170 |
sub(tmp, len, tmp2); // Remaining bytes for main loop. |
|
4171 |
cmpdi(CCR0, tmp, mainLoop_stepping); |
|
4172 |
blt(CCR0, L_tail); // For less than one mainloop_stepping left, do only tail processing |
|
4173 |
mr(len, tmp); // remaining bytes for main loop (>=mainLoop_stepping is guaranteed). |
|
4174 |
} |
|
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4175 |
update_byteLoop_crc32(crc, buf, tmp2, table, data, false); |
31861 | 4176 |
} |
4177 |
||
4178 |
srdi(tmp2, len, log_stepping); // #iterations for mainLoop |
|
4179 |
andi(len, len, mainLoop_stepping-1); // remaining bytes for tailLoop |
|
4180 |
mtctr(tmp2); |
|
4181 |
||
4182 |
#ifdef VM_LITTLE_ENDIAN |
|
4183 |
Register crc_rv = crc; |
|
4184 |
#else |
|
4185 |
Register crc_rv = tmp; // Load_reverse needs separate registers to work on. |
|
4186 |
// Occupies tmp, but frees up crc. |
|
35541
cba047a086d5
8146613: PPC64: C2 does no longer respect int to long conversion for stub calls
mdoerr
parents:
35085
diff
changeset
|
4187 |
load_reverse_32(crc_rv, crc); // Revert byte order because we are dealing with big-endian data. |
31861 | 4188 |
tmp = crc; |
4189 |
#endif |
|
4190 |
||
4191 |
int reconstructTableOffset = crc32_table_columns(table, tc0, tc1, tc2, tc3); |
|
4192 |
||
4193 |
align(mainLoop_alignment); // Octoword-aligned loop address. Shows 2% improvement. |
|
4194 |
BIND(L_mainLoop); |
|
4195 |
update_1word_crc32(crc_rv, buf, table, 0, mainLoop_stepping, crc_rv, t1, t2, t3, tc0, tc1, tc2, tc3); |
|
4196 |
bdnz(L_mainLoop); |
|
4197 |
||
4198 |
#ifndef VM_LITTLE_ENDIAN |
|
4199 |
load_reverse_32(crc, crc_rv); // Revert byte order because we are dealing with big-endian data. |
|
4200 |
tmp = crc_rv; // Tmp uses it's original register again. |
|
4201 |
#endif |
|
4202 |
||
4203 |
// Restore original table address for tailLoop. |
|
4204 |
if (reconstructTableOffset != 0) { |
|
4205 |
addi(table, table, -reconstructTableOffset); |
|
4206 |
} |
|
4207 |
||
4208 |
// Process last few (<complexThreshold) bytes of buffer. |
|
4209 |
BIND(L_tail); |
|
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4210 |
update_byteLoop_crc32(crc, buf, len, table, data, false); |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4211 |
|
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4212 |
if (invertCRC) { |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4213 |
nand(crc, crc, crc); // 1s complement of crc |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4214 |
} |
31861 | 4215 |
BLOCK_COMMENT("} kernel_crc32_1word"); |
4216 |
} |
|
4217 |
||
4218 |
/** |
|
4219 |
* @param crc register containing existing CRC (32-bit) |
|
4220 |
* @param buf register pointing to input byte buffer (byte*) |
|
4221 |
* @param len register containing number of bytes |
|
4222 |
* @param table register pointing to CRC table |
|
4223 |
* |
|
4224 |
* Uses R7_ARG5, R8_ARG6 as work registers. |
|
4225 |
*/ |
|
4226 |
void MacroAssembler::kernel_crc32_1byte(Register crc, Register buf, Register len, Register table, |
|
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4227 |
Register t0, Register t1, Register t2, Register t3, |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4228 |
bool invertCRC) { |
31861 | 4229 |
assert_different_registers(crc, buf, len, table); |
4230 |
||
4231 |
Register data = t0; // Holds the current byte to be folded into crc. |
|
4232 |
||
4233 |
BLOCK_COMMENT("kernel_crc32_1byte {"); |
|
4234 |
||
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4235 |
if (invertCRC) { |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4236 |
nand(crc, crc, crc); // 1s complement of crc |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4237 |
} |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4238 |
|
31861 | 4239 |
// Process all bytes in a single-byte loop. |
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4240 |
update_byteLoop_crc32(crc, buf, len, table, data, true); |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4241 |
|
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4242 |
if (invertCRC) { |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4243 |
nand(crc, crc, crc); // 1s complement of crc |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4244 |
} |
31861 | 4245 |
BLOCK_COMMENT("} kernel_crc32_1byte"); |
4246 |
} |
|
4247 |
||
41334 | 4248 |
/** |
4249 |
* @param crc register containing existing CRC (32-bit) |
|
4250 |
* @param buf register pointing to input byte buffer (byte*) |
|
4251 |
* @param len register containing number of bytes |
|
4252 |
* @param table register pointing to CRC table |
|
4253 |
* @param constants register pointing to CRC table for 128-bit aligned memory |
|
4254 |
* @param barretConstants register pointing to table for barrett reduction |
|
49376
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4255 |
* @param t0-t4 temp registers |
41334 | 4256 |
*/ |
49376
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4257 |
void MacroAssembler::kernel_crc32_1word_vpmsum(Register crc, Register buf, Register len, Register table, |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4258 |
Register constants, Register barretConstants, |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4259 |
Register t0, Register t1, Register t2, Register t3, Register t4, |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4260 |
bool invertCRC) { |
41334 | 4261 |
assert_different_registers(crc, buf, len, table); |
4262 |
||
49376
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4263 |
Label L_alignedHead, L_tail; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4264 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4265 |
BLOCK_COMMENT("kernel_crc32_1word_vpmsum {"); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4266 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4267 |
// 1. ~c |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4268 |
if (invertCRC) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4269 |
nand(crc, crc, crc); // 1s complement of crc |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4270 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4271 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4272 |
// 2. use kernel_crc32_1word for short len |
41334 | 4273 |
clrldi(len, len, 32); |
49376
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4274 |
cmpdi(CCR0, len, 512); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4275 |
blt(CCR0, L_tail); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4276 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4277 |
// 3. calculate from 0 to first aligned address |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4278 |
const int alignment = 16; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4279 |
Register prealign = t0; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4280 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4281 |
andi_(prealign, buf, alignment - 1); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4282 |
beq(CCR0, L_alignedHead); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4283 |
subfic(prealign, prealign, alignment); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4284 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4285 |
subf(len, prealign, len); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4286 |
update_byteLoop_crc32(crc, buf, prealign, table, t2, false); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4287 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4288 |
// 4. calculate from first aligned address as far as possible |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4289 |
BIND(L_alignedHead); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4290 |
kernel_crc32_1word_aligned(crc, buf, len, constants, barretConstants, t0, t1, t2, t3, t4); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4291 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4292 |
// 5. remaining bytes |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4293 |
BIND(L_tail); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4294 |
Register tc0 = t4; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4295 |
Register tc1 = constants; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4296 |
Register tc2 = barretConstants; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4297 |
kernel_crc32_1word(crc, buf, len, table, t0, t1, t2, t3, tc0, tc1, tc2, table, false); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4298 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4299 |
// 6. ~c |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4300 |
if (invertCRC) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4301 |
nand(crc, crc, crc); // 1s complement of crc |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4302 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4303 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4304 |
BLOCK_COMMENT("} kernel_crc32_1word_vpmsum"); |
41334 | 4305 |
} |
4306 |
||
4307 |
/** |
|
4308 |
* @param crc register containing existing CRC (32-bit) |
|
4309 |
* @param buf register pointing to input byte buffer (byte*) |
|
49376
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4310 |
* @param len register containing number of bytes (will get updated to remaining bytes) |
41334 | 4311 |
* @param constants register pointing to CRC table for 128-bit aligned memory |
4312 |
* @param barretConstants register pointing to table for barrett reduction |
|
49376
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4313 |
* @param t0-t4 temp registers |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4314 |
* Precondition: len should be >= 512. Otherwise, nothing will be done. |
41334 | 4315 |
*/ |
4316 |
void MacroAssembler::kernel_crc32_1word_aligned(Register crc, Register buf, Register len, |
|
49376
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4317 |
Register constants, Register barretConstants, |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4318 |
Register t0, Register t1, Register t2, Register t3, Register t4) { |
41334 | 4319 |
|
4320 |
// Save non-volatile vector registers (frameless). |
|
49376
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4321 |
Register offset = t1; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4322 |
int offsetInt = 0; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4323 |
offsetInt -= 16; li(offset, offsetInt); stvx(VR20, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4324 |
offsetInt -= 16; li(offset, offsetInt); stvx(VR21, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4325 |
offsetInt -= 16; li(offset, offsetInt); stvx(VR22, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4326 |
offsetInt -= 16; li(offset, offsetInt); stvx(VR23, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4327 |
offsetInt -= 16; li(offset, offsetInt); stvx(VR24, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4328 |
offsetInt -= 16; li(offset, offsetInt); stvx(VR25, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4329 |
#ifndef VM_LITTLE_ENDIAN |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4330 |
offsetInt -= 16; li(offset, offsetInt); stvx(VR26, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4331 |
#endif |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4332 |
offsetInt -= 8; std(R14, offsetInt, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4333 |
offsetInt -= 8; std(R15, offsetInt, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4334 |
offsetInt -= 8; std(R16, offsetInt, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4335 |
offsetInt -= 8; std(R17, offsetInt, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4336 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4337 |
// Implementation uses an inner loop which uses between 256 and 16 * unroll_factor |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4338 |
// bytes per iteration. The basic scheme is: |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4339 |
// lvx: load vector (Big Endian needs reversal) |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4340 |
// vpmsumw: carry-less 32 bit multiplications with constant representing a large CRC shift |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4341 |
// vxor: xor partial results together to get unroll_factor2 vectors |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4342 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4343 |
// Outer loop performs the CRC shifts needed to combine the unroll_factor2 vectors. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4344 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4345 |
// Using 16 * unroll_factor / unroll_factor_2 bytes for constants. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4346 |
const int unroll_factor = 2048; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4347 |
const int unroll_factor2 = 8; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4348 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4349 |
// Support registers. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4350 |
Register offs[] = { noreg, t0, t1, t2, t3, t4, crc /* will live in VCRC */, R14 }; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4351 |
Register num_bytes = R15, |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4352 |
loop_count = R16, |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4353 |
cur_const = R17; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4354 |
// Constant array for outer loop: unroll_factor2 - 1 registers, |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4355 |
// Constant array for inner loop: unroll_factor / unroll_factor2 registers. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4356 |
VectorRegister consts0[] = { VR16, VR17, VR18, VR19, VR20, VR21, VR22 }, |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4357 |
consts1[] = { VR23, VR24 }; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4358 |
// Data register arrays: 2 arrays with unroll_factor2 registers. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4359 |
VectorRegister data0[] = { VR0, VR1, VR2, VR3, VR4, VR5, VR6, VR7 }, |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4360 |
data1[] = { VR8, VR9, VR10, VR11, VR12, VR13, VR14, VR15 }; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4361 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4362 |
VectorRegister VCRC = data0[0]; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4363 |
VectorRegister Vc = VR25; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4364 |
VectorRegister swap_bytes = VR26; // Only for Big Endian. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4365 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4366 |
// We have at least 1 iteration (ensured by caller). |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4367 |
Label L_outer_loop, L_inner_loop, L_last; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4368 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4369 |
// If supported set DSCR pre-fetch to deepest. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4370 |
if (VM_Version::has_mfdscr()) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4371 |
load_const_optimized(t0, VM_Version::_dscr_val | 7); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4372 |
mtdscr(t0); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4373 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4374 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4375 |
mtvrwz(VCRC, crc); // crc lives lives in VCRC, now |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4376 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4377 |
for (int i = 1; i < unroll_factor2; ++i) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4378 |
li(offs[i], 16 * i); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4379 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4380 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4381 |
// Load consts for outer loop |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4382 |
lvx(consts0[0], constants); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4383 |
for (int i = 1; i < unroll_factor2 - 1; ++i) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4384 |
lvx(consts0[i], offs[i], constants); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4385 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4386 |
addi(constants, constants, (unroll_factor2 - 1) * 16); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4387 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4388 |
load_const_optimized(num_bytes, 16 * unroll_factor); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4389 |
load_const_optimized(loop_count, unroll_factor / (2 * unroll_factor2) - 1); // One double-iteration peeled off. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4390 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4391 |
// Reuse data registers outside of the loop. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4392 |
VectorRegister Vtmp = data1[0]; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4393 |
VectorRegister Vtmp2 = data1[1]; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4394 |
VectorRegister zeroes = data1[2]; |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4395 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4396 |
vspltisb(Vtmp, 0); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4397 |
vsldoi(VCRC, Vtmp, VCRC, 8); // 96 bit zeroes, 32 bit CRC. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4398 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4399 |
// Load vector for vpermxor (to xor both 64 bit parts together) |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4400 |
lvsl(Vtmp, buf); // 000102030405060708090a0b0c0d0e0f |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4401 |
vspltisb(Vc, 4); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4402 |
vsl(Vc, Vtmp, Vc); // 00102030405060708090a0b0c0d0e0f0 |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4403 |
xxspltd(Vc->to_vsr(), Vc->to_vsr(), 0); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4404 |
vor(Vc, Vtmp, Vc); // 001122334455667708192a3b4c5d6e7f |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4405 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4406 |
#ifdef VM_LITTLE_ENDIAN |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4407 |
#define BE_swap_bytes(x) |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4408 |
#else |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4409 |
vspltisb(Vtmp2, 0xf); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4410 |
vxor(swap_bytes, Vtmp, Vtmp2); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4411 |
#define BE_swap_bytes(x) vperm(x, x, x, swap_bytes) |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4412 |
#endif |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4413 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4414 |
cmpd(CCR0, len, num_bytes); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4415 |
blt(CCR0, L_last); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4416 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4417 |
// ********** Main loop start ********** |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4418 |
align(32); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4419 |
bind(L_outer_loop); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4420 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4421 |
// Begin of unrolled first iteration (no xor). |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4422 |
lvx(data1[0], buf); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4423 |
mr(cur_const, constants); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4424 |
for (int i = 1; i < unroll_factor2 / 2; ++i) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4425 |
lvx(data1[i], offs[i], buf); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4426 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4427 |
vpermxor(VCRC, VCRC, VCRC, Vc); // xor both halves to 64 bit result. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4428 |
lvx(consts1[0], cur_const); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4429 |
mtctr(loop_count); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4430 |
for (int i = 0; i < unroll_factor2 / 2; ++i) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4431 |
BE_swap_bytes(data1[i]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4432 |
if (i == 0) { vxor(data1[0], data1[0], VCRC); } // xor in previous CRC. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4433 |
lvx(data1[i + unroll_factor2 / 2], offs[i + unroll_factor2 / 2], buf); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4434 |
vpmsumw(data0[i], data1[i], consts1[0]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4435 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4436 |
addi(buf, buf, 16 * unroll_factor2); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4437 |
subf(len, num_bytes, len); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4438 |
lvx(consts1[1], offs[1], cur_const); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4439 |
addi(cur_const, cur_const, 32); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4440 |
// Begin of unrolled second iteration (head). |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4441 |
for (int i = 0; i < unroll_factor2 / 2; ++i) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4442 |
BE_swap_bytes(data1[i + unroll_factor2 / 2]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4443 |
if (i == 0) { lvx(data1[0], buf); } else { lvx(data1[i], offs[i], buf); } |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4444 |
vpmsumw(data0[i + unroll_factor2 / 2], data1[i + unroll_factor2 / 2], consts1[0]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4445 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4446 |
for (int i = 0; i < unroll_factor2 / 2; ++i) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4447 |
BE_swap_bytes(data1[i]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4448 |
lvx(data1[i + unroll_factor2 / 2], offs[i + unroll_factor2 / 2], buf); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4449 |
vpmsumw(data1[i], data1[i], consts1[1]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4450 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4451 |
addi(buf, buf, 16 * unroll_factor2); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4452 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4453 |
// Generate most performance relevant code. Loads + half of the vpmsumw have been generated. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4454 |
// Double-iteration allows using the 2 constant registers alternatingly. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4455 |
align(32); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4456 |
bind(L_inner_loop); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4457 |
for (int j = 1; j < 3; ++j) { // j < unroll_factor / unroll_factor2 - 1 for complete unrolling. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4458 |
if (j & 1) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4459 |
lvx(consts1[0], cur_const); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4460 |
} else { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4461 |
lvx(consts1[1], offs[1], cur_const); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4462 |
addi(cur_const, cur_const, 32); |
41334 | 4463 |
} |
49376
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4464 |
for (int i = 0; i < unroll_factor2; ++i) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4465 |
int idx = i + unroll_factor2 / 2, inc = 0; // For modulo-scheduled input. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4466 |
if (idx >= unroll_factor2) { idx -= unroll_factor2; inc = 1; } |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4467 |
BE_swap_bytes(data1[idx]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4468 |
vxor(data0[i], data0[i], data1[i]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4469 |
if (i == 0) lvx(data1[0], buf); else lvx(data1[i], offs[i], buf); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4470 |
vpmsumw(data1[idx], data1[idx], consts1[(j + inc) & 1]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4471 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4472 |
addi(buf, buf, 16 * unroll_factor2); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4473 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4474 |
bdnz(L_inner_loop); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4475 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4476 |
// Tail of last iteration (no loads). |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4477 |
for (int i = 0; i < unroll_factor2 / 2; ++i) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4478 |
BE_swap_bytes(data1[i + unroll_factor2 / 2]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4479 |
vxor(data0[i], data0[i], data1[i]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4480 |
vpmsumw(data1[i + unroll_factor2 / 2], data1[i + unroll_factor2 / 2], consts1[1]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4481 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4482 |
for (int i = 0; i < unroll_factor2 / 2; ++i) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4483 |
vpmsumw(data0[i], data0[i], consts0[unroll_factor2 - 2 - i]); // First half of fixup shifts. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4484 |
vxor(data0[i + unroll_factor2 / 2], data0[i + unroll_factor2 / 2], data1[i + unroll_factor2 / 2]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4485 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4486 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4487 |
// Last data register is ok, other ones need fixup shift. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4488 |
for (int i = unroll_factor2 / 2; i < unroll_factor2 - 1; ++i) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4489 |
vpmsumw(data0[i], data0[i], consts0[unroll_factor2 - 2 - i]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4490 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4491 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4492 |
// Combine to 128 bit result vector VCRC = data0[0]. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4493 |
for (int i = 1; i < unroll_factor2; i<<=1) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4494 |
for (int j = 0; j <= unroll_factor2 - 2*i; j+=2*i) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4495 |
vxor(data0[j], data0[j], data0[j+i]); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4496 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4497 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4498 |
cmpd(CCR0, len, num_bytes); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4499 |
bge(CCR0, L_outer_loop); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4500 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4501 |
// Last chance with lower num_bytes. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4502 |
bind(L_last); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4503 |
srdi(loop_count, len, exact_log2(16 * 2 * unroll_factor2)); // Use double-iterations. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4504 |
add_const_optimized(constants, constants, 16 * (unroll_factor / unroll_factor2)); // Point behind last one. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4505 |
sldi(R0, loop_count, exact_log2(16 * 2)); // Bytes of constants to be used. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4506 |
clrrdi(num_bytes, len, exact_log2(16 * 2 * unroll_factor2)); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4507 |
subf(constants, R0, constants); // Point to constant to be used first. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4508 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4509 |
addic_(loop_count, loop_count, -1); // One double-iteration peeled off. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4510 |
bgt(CCR0, L_outer_loop); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4511 |
// ********** Main loop end ********** |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4512 |
#undef BE_swap_bytes |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4513 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4514 |
// Restore DSCR pre-fetch value. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4515 |
if (VM_Version::has_mfdscr()) { |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4516 |
load_const_optimized(t0, VM_Version::_dscr_val); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4517 |
mtdscr(t0); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4518 |
} |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4519 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4520 |
vspltisb(zeroes, 0); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4521 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4522 |
// Combine to 64 bit result. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4523 |
vpermxor(VCRC, VCRC, VCRC, Vc); // xor both halves to 64 bit result. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4524 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4525 |
// Reduce to 32 bit CRC: Remainder by multiply-high. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4526 |
lvx(Vtmp, barretConstants); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4527 |
vsldoi(Vtmp2, zeroes, VCRC, 12); // Extract high 32 bit. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4528 |
vpmsumd(Vtmp2, Vtmp2, Vtmp); // Multiply by inverse long poly. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4529 |
vsldoi(Vtmp2, zeroes, Vtmp2, 12); // Extract high 32 bit. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4530 |
vsldoi(Vtmp, zeroes, Vtmp, 8); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4531 |
vpmsumd(Vtmp2, Vtmp2, Vtmp); // Multiply quotient by long poly. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4532 |
vxor(VCRC, VCRC, Vtmp2); // Remainder fits into 32 bit. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4533 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4534 |
// Move result. len is already updated. |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4535 |
vsldoi(VCRC, VCRC, zeroes, 8); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4536 |
mfvrd(crc, VCRC); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4537 |
|
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4538 |
// Restore non-volatile Vector registers (frameless). |
41334 | 4539 |
offsetInt = 0; |
49376
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4540 |
offsetInt -= 16; li(offset, offsetInt); lvx(VR20, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4541 |
offsetInt -= 16; li(offset, offsetInt); lvx(VR21, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4542 |
offsetInt -= 16; li(offset, offsetInt); lvx(VR22, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4543 |
offsetInt -= 16; li(offset, offsetInt); lvx(VR23, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4544 |
offsetInt -= 16; li(offset, offsetInt); lvx(VR24, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4545 |
offsetInt -= 16; li(offset, offsetInt); lvx(VR25, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4546 |
#ifndef VM_LITTLE_ENDIAN |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4547 |
offsetInt -= 16; li(offset, offsetInt); lvx(VR26, offset, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4548 |
#endif |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4549 |
offsetInt -= 8; ld(R14, offsetInt, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4550 |
offsetInt -= 8; ld(R15, offsetInt, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4551 |
offsetInt -= 8; ld(R16, offsetInt, R1_SP); |
7cd503c499a0
8198894: [PPC64] More generic vector CRC implementation
mdoerr
parents:
49347
diff
changeset
|
4552 |
offsetInt -= 8; ld(R17, offsetInt, R1_SP); |
41334 | 4553 |
} |
4554 |
||
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4555 |
// Emits code that folds one byte, read from memory at buf, into the CRC held in crc.
//   crc       - CRC register; updated in place.
//   buf       - address register; the byte at offset 0 is loaded. No instruction here writes buf.
//   len       - not used by this routine (and therefore left out of the register check below).
//   table     - passed through to update_byte_crc32() (presumably the CRC lookup table base -- confirm there).
//   tmp       - scratch register; receives the loaded byte.
//   invertCRC - evaluated while generating code: if true, a bitwise complement of crc is
//               emitted both before and after the update.
void MacroAssembler::kernel_crc32_singleByte(Register crc, Register buf, Register len, Register table, Register tmp, bool invertCRC) { |
31861 | 4556 |
assert_different_registers(crc, buf, /* len, not used!! */ table, tmp); |
4557 |
||
4558 |
BLOCK_COMMENT("kernel_crc32_singleByte:"); |
|
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4559 |
// nand of a register with itself yields its bitwise complement.
if (invertCRC) { |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4560 |
nand(crc, crc, crc); // 1s complement of crc |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4561 |
} |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4562 |
|
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4563 |
lbz(tmp, 0, buf); // Byte from buffer, zero-extended. |
31861 | 4564 |
update_byte_crc32(crc, tmp, table); |
4565 |
||
46317
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4566 |
// Undo the complement applied above so the caller sees the same representation it passed in.
if (invertCRC) { |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4567 |
nand(crc, crc, crc); // 1s complement of crc |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4568 |
} |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4569 |
} |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4570 |
|
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4571 |
// Emits code that folds one byte, already available in register val, into the CRC held in crc.
// Register-operand counterpart of kernel_crc32_singleByte: no memory load is emitted here.
//   crc       - CRC register; updated in place.
//   val       - register holding the input byte; handed unchanged to update_byte_crc32().
//   table     - passed through to update_byte_crc32() (presumably the CRC lookup table base -- confirm there).
//   invertCRC - evaluated while generating code: if true, a bitwise complement of crc is
//               emitted both before and after the update.
void MacroAssembler::kernel_crc32_singleByteReg(Register crc, Register val, Register table, bool invertCRC) { |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4572 |
assert_different_registers(crc, val, table); |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4573 |
|
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4574 |
BLOCK_COMMENT("kernel_crc32_singleByteReg:"); |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4575 |
// nand of a register with itself yields its bitwise complement.
if (invertCRC) { |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4576 |
nand(crc, crc, crc); // 1s complement of crc |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4577 |
} |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4578 |
|
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4579 |
update_byte_crc32(crc, val, table); |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4580 |
|
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4581 |
// Undo the complement applied above so the caller sees the same representation it passed in.
if (invertCRC) { |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4582 |
nand(crc, crc, crc); // 1s complement of crc |
5f88747fe29e
8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents:
43428
diff
changeset
|
4583 |
} |
31861 | 4584 |
} |
4585 |
||
31773 | 4586 |
// dest_lo += src1 + src2 |
4587 |
// dest_hi += carry1 + carry2 |
|
4588 |
// Emits a 128-bit accumulation in two steps: (dest_hi:dest_lo) += src1, then += src2.
//   dest_hi, dest_lo - high and low halves of the accumulator; both are updated in place.
//   src1, src2       - the two addends that are added into dest_lo.
// Overwrites R0 with 0 before anything else, so a value living in R0 (including an
// operand passed in R0) does not survive this sequence.
void MacroAssembler::add2_with_carry(Register dest_hi, |
|
4589 |
Register dest_lo, |
|
4590 |
Register src1, Register src2) { |
|
4591 |
// R0 = 0 serves as the "other operand" of the adde instructions below.
li(R0, 0); |
|
4592 |
// addc records the carry out of the low half ...
addc(dest_lo, dest_lo, src1); |
|
4593 |
// ... and adde adds that carry (plus the zero in R0) into the high half.
adde(dest_hi, dest_hi, R0); |
|
4594 |
// Same pair again for the second addend.
addc(dest_lo, dest_lo, src2); |
|
4595 |
adde(dest_hi, dest_hi, R0); |
|
4596 |
} |
|
4597 |
||
4598 |
// Multiply 64 bit by 64 bit first loop. |
|
4599 |
// Emits the "first loop" sketched in the pseudo code below: one 64-bit chunk of x is
// multiplied with successive 64-bit chunks of y, and each low product half is stored to z.
//   x, y, z       - base address registers of the int arrays.
//   xstart        - int index into x; decremented by one here.
//   x_xstart      - receives the chunk of x that is used as the fixed multiplicand.
//   y_idx         - receives the current chunk of y.
//   idx, kdx      - int indices into y and z; both are stepped down by 2 per multiplication.
//   carry         - carry between iterations; holds the last high product half on exit.
//   product_high,
//   product       - halves of the 128-bit intermediate (as produced by multiply64()).
//   tmp           - scratch for byte offsets and for the zero operand of adde.
// NOTE(review): the final "z[xstart] = carry" of the pseudo code is not emitted in this
// routine; presumably the caller stores carry -- confirm at the call site.
void MacroAssembler::multiply_64_x_64_loop(Register x, Register xstart, |
|
4600 |
Register x_xstart, |
|
4601 |
Register y, Register y_idx, |
|
4602 |
Register z, |
|
4603 |
Register carry, |
|
4604 |
Register product_high, Register product, |
|
4605 |
Register idx, Register kdx, |
|
4606 |
Register tmp) { |
|
4607 |
// jlong carry, x[], y[], z[]; |
|
4608 |
// for (int idx=ystart, kdx=ystart+1+xstart; idx >= 0; idx--, kdx--) { |
|
4609 |
// huge_128 product = y[idx] * x[xstart] + carry; |
|
4610 |
// z[kdx] = (jlong)product; |
|
4611 |
// carry = (jlong)(product >>> 64); |
|
4612 |
// } |
|
4613 |
// z[xstart] = carry; |
|
4614 |
||
4615 |
Label L_first_loop, L_first_loop_exit; |
|
4616 |
Label L_one_x, L_one_y, L_multiply; |
|
4617 |
||
4618 |
// Record form: CR0 reflects the decremented xstart, which the branch below tests.
addic_(xstart, xstart, -1); |
|
4619 |
blt(CCR0, L_one_x); // Special case: length of x is 1. |
|
4620 |
||
4621 |
// Load next two integers of x. |
|
4622 |
// Int index -> byte offset (shift by LogBytesPerInt), then one 64-bit load.
sldi(tmp, xstart, LogBytesPerInt); |
|
4623 |
ldx(x_xstart, x, tmp); |
|
4624 |
#ifdef VM_LITTLE_ENDIAN |
|
4625 |
// Rotate by 32 with no mask: swaps the two 32-bit halves of the loaded doubleword.
rldicl(x_xstart, x_xstart, 32, 0); |
|
4626 |
#endif |
|
4627 |
||
4628 |
align(32, 16); |
|
4629 |
bind(L_first_loop); |
|
4630 |
||
4631 |
// idx < 1: nothing left. idx == 1: a single int of y is left (L_one_y).
cmpdi(CCR0, idx, 1); |
|
4632 |
blt(CCR0, L_first_loop_exit); |
|
4633 |
// addi does not touch CR0, so the beq below still tests the cmpdi result (idx == 1).
addi(idx, idx, -2); |
|
4634 |
beq(CCR0, L_one_y); |
|
4635 |
||
4636 |
// Load next two integers of y. |
|
4637 |
sldi(tmp, idx, LogBytesPerInt); |
|
4638 |
ldx(y_idx, y, tmp); |
|
4639 |
#ifdef VM_LITTLE_ENDIAN |
|
4640 |
rldicl(y_idx, y_idx, 32, 0); |
|
4641 |
#endif |
|
4642 |
||
4643 |
||
4644 |
bind(L_multiply); |
|
4645 |
multiply64(product_high, product, x_xstart, y_idx); |
|
4646 |
||
4647 |
// tmp = 0 is the zero operand for adde, which only propagates the carry bit.
li(tmp, 0); |
|
4648 |
addc(product, product, carry); // Add carry to result. |
|
4649 |
adde(product_high, product_high, tmp); // Add carry of the last addition. |
|
4650 |
addi(kdx, kdx, -2); |
|
4651 |
||
4652 |
// Store result. |
|
4653 |
#ifdef VM_LITTLE_ENDIAN |
|
4654 |
rldicl(product, product, 32, 0); |
|
4655 |
#endif |
|
4656 |
sldi(tmp, kdx, LogBytesPerInt); |
|
4657 |
stdx(product, z, tmp); |
|
4658 |
// The high half becomes the carry for the next iteration.
mr_if_needed(carry, product_high); |
|
4659 |
b(L_first_loop); |
|
4660 |
||
4661 |
||
4662 |
bind(L_one_y); // Load one 32 bit portion of y as (0,value). |
|
4663 |
||
4664 |
// lwz reads the word at offset 0 of y and zero-extends it.
lwz(y_idx, 0, y); |
|
4665 |
b(L_multiply); |
|
4666 |
||
4667 |
||
31861 | 4668 |
bind(L_one_x); // Load one 32 bit portion of x as (0,value). |
31773 | 4669 |
|
4670 |
lwz(x_xstart, 0, x); |
|
4671 |
b(L_first_loop); |
|
4672 |
||
4673 |
bind(L_first_loop_exit); |
|
4674 |
} |
|
4675 |
||
4676 |
// Multiply 64 bit by 64 bit and add 128 bit. |
|
4677 |
// Emits one multiply-accumulate step: a 64-bit chunk of y is multiplied by x_xstart,
// the corresponding 64-bit chunk of z and the incoming carry are added, and the low
// 64 bits of the sum are stored back to z. The high 64 bits are left in product_high.
//   x_xstart      - multiplicand (not modified here).
//   y, z          - base address registers.
//   yz_idx        - scratch; first holds the chunk of y, then the chunk of z.
//   idx           - int index; converted to a byte offset via LogBytesPerInt.
//   carry         - incoming carry that is added to the product.
//   product_high,
//   product       - halves of the 128-bit result.
//   tmp           - scratch for the byte offset.
//   offset        - extra byte offset, known at code-generation time; no addi is emitted for 0.
// Note that y and z are addressed with the same byte offset; any bias between the two
// indices (kdx vs. idx in the pseudo code) has to be part of the z base register.
// R0 is overwritten by the add2_with_carry() sequence.
void MacroAssembler::multiply_add_128_x_128(Register x_xstart, Register y, |
|
4678 |
Register z, Register yz_idx, |
|
4679 |
Register idx, Register carry, |
|
4680 |
Register product_high, Register product, |
|
4681 |
Register tmp, int offset) { |
|
4682 |
||
4683 |
// huge_128 product = (y[idx] * x_xstart) + z[kdx] + carry; |
|
4684 |
// z[kdx] = (jlong)product; |
|
4685 |
||
4686 |
// tmp = idx * sizeof(int) [+ offset]: byte offset used for both y and z.
sldi(tmp, idx, LogBytesPerInt); |
|
31861 | 4687 |
if (offset) { |
31773 | 4688 |
addi(tmp, tmp, offset); |
4689 |
} |
|
4690 |
ldx(yz_idx, y, tmp); |
|
4691 |
#ifdef VM_LITTLE_ENDIAN |
|
4692 |
// Rotate by 32 with no mask: swaps the two 32-bit halves of the loaded doubleword.
rldicl(yz_idx, yz_idx, 32, 0); |
|
4693 |
#endif |
|
4694 |
||
4695 |
multiply64(product_high, product, x_xstart, yz_idx); |
|
4696 |
// yz_idx is reused: it now receives the chunk of z at the same byte offset.
ldx(yz_idx, z, tmp); |
|
4697 |
#ifdef VM_LITTLE_ENDIAN |
|
4698 |
rldicl(yz_idx, yz_idx, 32, 0); |
|
4699 |
#endif |
|
4700 |
||
4701 |
// (product_high:product) += carry; then += yz_idx.
add2_with_carry(product_high, product, carry, yz_idx); |
|
4702 |
||
4703 |
// The byte offset is computed a second time before the store.
sldi(tmp, idx, LogBytesPerInt); |
|
31861 | 4704 |
if (offset) { |
31773 | 4705 |
addi(tmp, tmp, offset); |
4706 |
} |
|
4707 |
#ifdef VM_LITTLE_ENDIAN |
|
4708 |
// Swap the halves back into memory order before storing.
rldicl(product, product, 32, 0); |
|
4709 |
#endif |
|
4710 |
stdx(product, z, tmp); |
|
4711 |
} |
|
4712 |
||
4713 |
// Multiply 128 bit by 128 bit. Unrolled inner loop. |
|
4714 |
// Emits the "third loop" sketched in the pseudo code below. The main loop consumes four
// ints (two 64-bit chunks) of y per iteration via two multiply_add_128_x_128() steps;
// afterwards up to three left-over ints are handled (one 64-bit step and/or one 32-bit step).
//   x_xstart      - multiplicand (not modified here).
//   y, z          - base address registers.
//   yz_idx        - scratch for the loaded chunks of y and z.
//   idx           - number of ints still to process; modified throughout.
//   carry         - carry in/out; holds the final carry on exit.
//   carry2        - carry between the two steps of one main-loop iteration.
//   product_high,
//   product       - halves of the 128-bit intermediate.
//   tmp           - scratch for byte offsets.
// Uses R0 (as jdx, and inside add2_with_carry()) and the CTR register.
void MacroAssembler::multiply_128_x_128_loop(Register x_xstart, |
|
4715 |
Register y, Register z, |
|
4716 |
Register yz_idx, Register idx, Register carry, |
|
4717 |
Register product_high, Register product, |
|
4718 |
Register carry2, Register tmp) { |
|
4719 |
||
4720 |
// jlong carry, x[], y[], z[]; |
|
4721 |
// int kdx = ystart+1; |
|
4722 |
// for (int idx=ystart-2; idx >= 0; idx -= 2) { // Third loop |
|
4723 |
// huge_128 product = (y[idx+1] * x_xstart) + z[kdx+idx+1] + carry; |
|
4724 |
// z[kdx+idx+1] = (jlong)product; |
|
4725 |
// jlong carry2 = (jlong)(product >>> 64); |
|
4726 |
// product = (y[idx] * x_xstart) + z[kdx+idx] + carry2; |
|
4727 |
// z[kdx+idx] = (jlong)product; |
|
4728 |
// carry = (jlong)(product >>> 64); |
|
4729 |
// } |
|
4730 |
// idx += 2; |
|
4731 |
// if (idx > 0) { |
|
4732 |
// product = (y[idx] * x_xstart) + z[kdx+idx] + carry; |
|
4733 |
// z[kdx+idx] = (jlong)product; |
|
4734 |
// carry = (jlong)(product >>> 64); |
|
4735 |
// } |
|
4736 |
||
4737 |
Label L_third_loop, L_third_loop_exit, L_post_third_loop_done; |
|
4738 |
// jdx lives in R0. That is fine although add2_with_carry() overwrites R0 inside the loop:
// jdx is only needed until it has been moved to CTR.
const Register jdx = R0; |
|
4739 |
||
4740 |
// Scale the index. |
|
4741 |
// jdx = idx / 4 = number of main-loop iterations; the record form sets CR0 for the beq.
srdi_(jdx, idx, 2); |
|
4742 |
beq(CCR0, L_third_loop_exit); |
|
4743 |
mtctr(jdx); |
|
4744 |
||
4745 |
align(32, 16); |
|
4746 |
bind(L_third_loop); |
|
4747 |
||
4748 |
addi(idx, idx, -4); |
|
4749 |
||
4750 |
// First step at byte offset 8 (ints idx+2, idx+3); its high half goes to carry2.
multiply_add_128_x_128(x_xstart, y, z, yz_idx, idx, carry, product_high, product, tmp, 8); |
|
4751 |
mr_if_needed(carry2, product_high); |
|
4752 |
||
4753 |
// Second step at byte offset 0 (ints idx, idx+1), fed with carry2.
multiply_add_128_x_128(x_xstart, y, z, yz_idx, idx, carry2, product_high, product, tmp, 0); |
|
4754 |
mr_if_needed(carry, product_high); |
|
4755 |
// Decrement CTR and loop while it is non-zero.
bdnz(L_third_loop); |
|
4756 |
||
4757 |
bind(L_third_loop_exit); // Handle any left-over operand parts. |
|
4758 |
||
4759 |
// idx & 3 = number of ints the main loop did not cover (0..3).
andi_(idx, idx, 0x3); |
|
4760 |
beq(CCR0, L_post_third_loop_done); |
|
4761 |
||
4762 |
Label L_check_1; |
|
4763 |
||
4764 |
// At least two ints left? Then do one more 64-bit step at the decremented idx.
addic_(idx, idx, -2); |
|
4765 |
blt(CCR0, L_check_1); |
|
4766 |
||
4767 |
multiply_add_128_x_128(x_xstart, y, z, yz_idx, idx, carry, product_high, product, tmp, 0); |
|
4768 |
mr_if_needed(carry, product_high); |
|
4769 |
||
4770 |
bind(L_check_1); |
|
4771 |
||
4772 |
// Undo the -2, keep only the lowest bit, subtract 1: the result is 0 if a single int
// is left and negative if none is left.
addi(idx, idx, 0x2); |
|
35085 | 4773 |
andi_(idx, idx, 0x1); |
31773 | 4774 |
addic_(idx, idx, -1); |
4775 |
blt(CCR0, L_post_third_loop_done); |
|
4776 |
||
4777 |
// Last single int: 32-bit loads from y and z (lwzx zero-extends).
sldi(tmp, idx, LogBytesPerInt); |
|
4778 |
lwzx(yz_idx, y, tmp); |
|
4779 |
multiply64(product_high, product, x_xstart, yz_idx); |
|
4780 |
lwzx(yz_idx, z, tmp); |
|
4781 |
||
4782 |
add2_with_carry(product_high, product, yz_idx, carry); |
|
4783 |
||
4784 |
sldi(tmp, idx, LogBytesPerInt); |
|
4785 |
// Only the low 32 bits of the sum are stored ...
stwx(product, z, tmp); |
|
4786 |
// ... the remaining bits form the new carry: (product_high << 32) | (product >> 32).
srdi(product, product, 32); |
|
4787 |
||
4788 |
sldi(product_high, product_high, 32); |
|
4789 |
orr(product, product, product_high); |
|
4790 |
mr_if_needed(carry, product); |
|
4791 |
||
4792 |
bind(L_post_third_loop_done); |
|
4793 |
} // multiply_128_x_128_loop |
|
4794 |
||
47521
122833427b36
8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents:
47520
diff
changeset
|
4795 |
// Emits a multiply-accumulate loop over 32-bit words. For each of the 'len'
// words of 'in', walking from the last word towards the first:
//   sum        = in_word * k + out_word + carry
//   out_word   = low 32 bits of sum
//   carry      = sum >> 32
// 'offset' is used as a byte offset into 'out'; it is moved back by 4 before
// the first access and by 4 after every processed word.
// On exit 'carry' holds the final carry (0 when len <= 0).
// Kills: offset, len, tmp1, tmp2, CCR0 and (for len > 0) CTR.
// NOTE(review): presumably 'k' is expected to hold a zero-extended 32-bit
// value so that the 64-bit sum cannot overflow - confirm against the caller.
void MacroAssembler::muladd(Register out, Register in,
                            Register offset, Register len, Register k,
                            Register tmp1, Register tmp2, Register carry) {
  Label L_word_loop, L_exit;

  // Compare first, branch later: offset and carry are set up between the
  // compare and the branch so they are initialized on the early exit as well.
  cmpdi(CCR0, len, 0);

  subi(offset, offset, 4);
  li(carry, 0);
  ble(CCR0, L_exit);           // Nothing to do unless len > 0.

  mtctr(len);                  // CTR counts the words to process.
  subi(len, len, 1);
  sldi(len, len, 2);           // len = (len - 1) * 4, byte offset of the last word of 'in'.

  bind(L_word_loop);
  lwzx(tmp1, len, in);         // tmp1 = current word of 'in'
  lwzx(tmp2, offset, out);     // tmp2 = current word of 'out'
  mulld(tmp1, tmp1, k);        // tmp1 = in_word * k
  add(tmp2, carry, tmp2);
  add(tmp2, tmp1, tmp2);       // tmp2 = in_word * k + out_word + carry
  stwx(tmp2, offset, out);     // Store the low 32 bits back into 'out'.
  srdi(carry, tmp2, 32);       // The upper 32 bits become the next carry.
  subi(offset, offset, 4);
  subi(len, len, 4);
  bdnz(L_word_loop);

  bind(L_exit);
}
122833427b36
8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents:
47520
diff
changeset
|
4828 |
|
31773 | 4829 |
// Emits code that multiplies the 32-bit-word arrays x (xlen words) and y
// (ylen words) into z (zlen words), following the Java reference loops quoted
// in the comments below.
//
// Register roles inside this routine:
//   tmp1 = idx          tmp2 = kdx           tmp3 = xstart
//   tmp4 = y_idx        tmp5 = carry         tmp6 = product
//   tmp7 = product_high tmp8 = x_xstart      tmp9 = scratch
//   tmp10..tmp13 = save slots for z, x, xstart and ylen across the inner loop.
// Only tmp1..tmp8 take part in the assert_different_registers checks.
// z, x and ylen are restored from their save slots after every inner loop;
// xlen is overwritten with the saved xstart value.
void MacroAssembler::multiply_to_len(Register x, Register xlen,
                                     Register y, Register ylen,
                                     Register z, Register zlen,
                                     Register tmp1, Register tmp2,
                                     Register tmp3, Register tmp4,
                                     Register tmp5, Register tmp6,
                                     Register tmp7, Register tmp8,
                                     Register tmp9, Register tmp10,
                                     Register tmp11, Register tmp12,
                                     Register tmp13) {

  ShortBranchVerifier sbv(this);

  assert_different_registers(x, xlen, y, ylen, z, zlen,
                             tmp1, tmp2, tmp3, tmp4, tmp5, tmp6);
  assert_different_registers(x, xlen, y, ylen, z, zlen,
                             tmp1, tmp2, tmp3, tmp4, tmp5, tmp7);
  assert_different_registers(x, xlen, y, ylen, z, zlen,
                             tmp1, tmp2, tmp3, tmp4, tmp5, tmp8);

  // Working registers.
  const Register idx          = tmp1;
  const Register kdx          = tmp2;
  const Register xstart       = tmp3;
  const Register y_idx        = tmp4;
  const Register carry        = tmp5;
  const Register product      = tmp6;
  const Register product_high = tmp7;
  const Register x_xstart     = tmp8;
  const Register tmp          = tmp9;

  // Save slots used around the inner (third) loop.
  const Register zsave        = tmp10;
  const Register xsave        = tmp11;
  const Register xlensave     = tmp12;
  const Register ylensave     = tmp13;

  Label L_done, L_second_loop, L_carry, L_last_x, L_third_loop_prologue;

  // First Loop.
  //
  //   final static long LONG_MASK = 0xffffffffL;
  //   int xstart = xlen - 1;
  //   int ystart = ylen - 1;
  //   long carry = 0;
  //   for (int idx=ystart, kdx=ystart+1+xstart; idx >= 0; idx--, kdx--) {
  //     long product = (y[idx] & LONG_MASK) * (x[xstart] & LONG_MASK) + carry;
  //     z[kdx] = (int)product;
  //     carry = product >>> 32;
  //   }
  //   z[xstart] = (int)carry;

  mr_if_needed(idx, ylen);        // idx = ylen
  mr_if_needed(kdx, zlen);        // kdx = zlen (original note: xlen + ylen)
  li(carry, 0);                   // carry = 0

  addic_(xstart, xlen, -1);       // xstart = xlen - 1
  blt(CCR0, L_done);              // Negative xstart: nothing to multiply.

  multiply_64_x_64_loop(x, xstart, x_xstart, y, y_idx, z,
                        carry, product_high, product, idx, kdx, tmp);

  cmpdi(CCR0, kdx, 0);
  beq(CCR0, L_second_loop);

  addic_(kdx, kdx, -1);
  beq(CCR0, L_carry);

  // Store lower 32 bits of carry.
  sldi(tmp, kdx, LogBytesPerInt);
  stwx(carry, z, tmp);
  srdi(carry, carry, 32);
  addi(kdx, kdx, -1);

  bind(L_carry);

  // Store upper 32 bits of carry.
  sldi(tmp, kdx, LogBytesPerInt);
  stwx(carry, z, tmp);

  // Second and third (nested) loops.
  //
  //   for (int i = xstart-1; i >= 0; i--) { // Second loop
  //     carry = 0;
  //     for (int jdx=ystart, k=ystart+1+i; jdx >= 0; jdx--, k--) { // Third loop
  //       long product = (y[jdx] & LONG_MASK) * (x[i] & LONG_MASK) +
  //                      (z[k] & LONG_MASK) + carry;
  //       z[k] = (int)product;
  //       carry = product >>> 32;
  //     }
  //     z[i] = (int)carry;
  //   }
  //
  // Original note: i = xlen, j = tmp1, k = tmp2, carry = tmp5, x[i] = rdx.
  // NOTE(review): 'rdx' is not a register used in this routine; the note looks
  // inherited from another port - confirm before relying on it.

  bind(L_second_loop);

  li(carry, 0);                   // carry = 0;

  addic_(xstart, xstart, -1);     // i = xstart-1;
  blt(CCR0, L_done);

  mr(zsave, z);                   // z is advanced below and restored after the inner loop.

  sldi(tmp, xstart, LogBytesPerInt);
  add(z, z, tmp);                 // z = z + k - j
  addi(z, z, 4);
  addic_(xstart, xstart, -1);     // i = xstart-1;
  blt(CCR0, L_last_x);            // Only one word of x left: handled out of line.

  // Fetch two words of x with one 64-bit load.
  sldi(tmp, xstart, LogBytesPerInt);
  ldx(x_xstart, x, tmp);
#ifdef VM_LITTLE_ENDIAN
  rldicl(x_xstart, x_xstart, 32, 0); // Rotate by 32 bits to swap the two words.
#endif

  bind(L_third_loop_prologue);

  mr(xsave, x);
  mr(xlensave, xstart);
  mr(ylensave, ylen);

  // x and ylen are handed to the inner loop as working registers, hence the saves above.
  multiply_128_x_128_loop(x_xstart, y, z, y_idx, ylen,
                          carry, product_high, product, x, tmp);

  mr(z, zsave);
  mr(x, xsave);
  mr(xlen, xlensave);             // This is the decrement of the loop counter!
  mr(ylen, ylensave);

  addi(xstart, xlen, 1);
  sldi(tmp, xstart, LogBytesPerInt);
  stwx(carry, z, tmp);            // Store the low 32 bits of carry.
  addic_(xstart, xstart, -1);
  blt(CCR0, L_done);

  srdi(carry, carry, 32);
  sldi(tmp, xstart, LogBytesPerInt);
  stwx(carry, z, tmp);            // Store the upper 32 bits of carry.
  b(L_second_loop);

  // Next infrequent code is moved outside loops.
  bind(L_last_x);

  lwz(x_xstart, 0, x);            // Load the single remaining word x[0].
  b(L_third_loop_prologue);

  bind(L_done);
} // multiply_to_len
|
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
4990 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
4991 |
// Debug builds only (ASSERT): emits a check of the condition that the
// preceding code has left in CCR0. If check_equal is true the emitted code
// continues when CCR0 signals 'equal', otherwise when it signals 'not equal';
// in the opposite case it runs into stop(msg, id).
// Emits nothing when ASSERT is not defined.
void MacroAssembler::asm_assert(bool check_equal, const char *msg, int id) {
#ifdef ASSERT
  Label L_passed;
  if (!check_equal) {
    bne(CCR0, L_passed);
  } else {
    beq(CCR0, L_passed);
  }
  stop(msg, id);
  bind(L_passed);
#endif
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5003 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5004 |
void MacroAssembler::asm_assert_mems_zero(bool check_equal, int size, int mem_offset, |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5005 |
Register mem_base, const char* msg, int id) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5006 |
#ifdef ASSERT |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5007 |
switch (size) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5008 |
case 4: |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5009 |
lwz(R0, mem_offset, mem_base); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5010 |
cmpwi(CCR0, R0, 0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5011 |
break; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5012 |
case 8: |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5013 |
ld(R0, mem_offset, mem_base); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5014 |
cmpdi(CCR0, R0, 0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5015 |
break; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5016 |
default: |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5017 |
ShouldNotReachHere(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5018 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5019 |
asm_assert(check_equal, msg, id); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5020 |
#endif // ASSERT |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5021 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5022 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5023 |
void MacroAssembler::verify_thread() { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5024 |
if (VerifyThread) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5025 |
unimplemented("'VerifyThread' currently not implemented on PPC"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5026 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5027 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5028 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5029 |
// READ: oop. KILL: R0. Volatile floats perhaps. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5030 |
void MacroAssembler::verify_oop(Register oop, const char* msg) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5031 |
if (!VerifyOops) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5032 |
return; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5033 |
} |
28187
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
5034 |
|
22861 | 5035 |
address/* FunctionDescriptor** */fd = StubRoutines::verify_oop_subroutine_entry_address(); |
28187
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
5036 |
const Register tmp = R11; // Will be preserved. |
35085 | 5037 |
const int nbytes_save = MacroAssembler::num_volatile_regs * 8; |
28187
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
5038 |
save_volatile_gprs(R1_SP, -nbytes_save); // except R0 |
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
5039 |
|
35085 | 5040 |
mr_if_needed(R4_ARG2, oop); |
28187
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
5041 |
save_LR_CR(tmp); // save in old frame |
23211 | 5042 |
push_frame_reg_args(nbytes_save, tmp); |
5043 |
// load FunctionDescriptor** / entry_address * |
|
28187
fc19df82d6ee
8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents:
27012
diff
changeset
|
5044 |
load_const_optimized(tmp, fd, R0); |
23211 | 5045 |
// load FunctionDescriptor* / entry_address |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5046 |
ld(tmp, 0, tmp); |
35085 | 5047 |
load_const_optimized(R3_ARG1, (address)msg, R0); |
5048 |
// Call destination for its side effect. |
|
5049 |
call_c(tmp); |
|
5050 |
||
5051 |
pop_frame(); |
|
5052 |
restore_LR_CR(tmp); |
|
5053 |
restore_volatile_gprs(R1_SP, -nbytes_save); // except R0 |
|
5054 |
} |
|
5055 |
||
5056 |
// Same as verify_oop, but the oop to check is loaded from memory at
// base + offs instead of being passed in a register.
// No code is emitted unless the VerifyOops flag is set.
void MacroAssembler::verify_oop_addr(RegisterOrConstant offs, Register base, const char* msg) {
  if (!VerifyOops) {
    return;
  }

  // Address of the cell that holds the stub's FunctionDescriptor* / entry address.
  address stub_entry_cell = StubRoutines::verify_oop_subroutine_entry_address();
  const Register scratch = R11; // Will be preserved.
  const int save_area_bytes = MacroAssembler::num_volatile_regs * 8;

  // Spill the volatile GPRs (except R0) below the current stack pointer.
  save_volatile_gprs(R1_SP, -save_area_bytes);

  // Second C argument: the oop, fetched from memory.
  ld(R4_ARG2, offs, base);

  save_LR_CR(scratch);                           // Saved in the old frame.
  push_frame_reg_args(save_area_bytes, scratch); // New frame covers the spill area.

  // Load FunctionDescriptor** / entry_address *, then dereference it to get
  // FunctionDescriptor* / entry_address.
  load_const_optimized(scratch, stub_entry_cell, R0);
  ld(scratch, 0, scratch);

  // First C argument: the message.
  load_const_optimized(R3_ARG1, (address)msg, R0);

  // Call destination for its side effect.
  call_c(scratch);

  // Undo frame, LR/CR and register spills in reverse order.
  pop_frame();
  restore_LR_CR(scratch);
  restore_volatile_gprs(R1_SP, -save_area_bytes); // except R0
}
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5081 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5082 |
// Printable names of the stop categories. The table is indexed with the
// 'type' value given to MacroAssembler::stop(), reduced modulo the number of
// entries by the code that reads it.
const char* stop_types[] = {
  "stop", "untested", "unimplemented", "shouldnotreachhere"
};
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5088 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5089 |
static void stop_on_request(int tp, const char* msg) { |
25374
d7fb2af5d53c
8048169: Change 8037816 breaks HS build on PPC64 and CPP-Interpreter platforms
coleenp
parents:
23492
diff
changeset
|
5090 |
tty->print("PPC assembly code requires stop: (%s) %s\n", stop_types[tp%/*stop_end*/4], msg); |
33105
294e48b4f704
8080775: Better argument formatting for assert() and friends
david
parents:
32596
diff
changeset
|
5091 |
guarantee(false, "PPC assembly code requires stop: %s", msg); |
22824
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5092 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5093 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5094 |
// Call a C-function that prints output. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5095 |
void MacroAssembler::stop(int type, const char* msg, int id) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5096 |
#ifndef PRODUCT |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5097 |
block_comment(err_msg("stop: %s %s {", stop_types[type%stop_end], msg)); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5098 |
#else |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5099 |
block_comment("stop {"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5100 |
#endif |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5101 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5102 |
// setup arguments |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5103 |
load_const_optimized(R3_ARG1, type); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5104 |
load_const_optimized(R4_ARG2, (void *)msg, /*tmp=*/R0); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5105 |
call_VM_leaf(CAST_FROM_FN_PTR(address, stop_on_request), R3_ARG1, R4_ARG2); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5106 |
illtrap(); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5107 |
emit_int32(id); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5108 |
block_comment("} stop;"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5109 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5110 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5111 |
#ifndef PRODUCT |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5112 |
// Write pattern 0x0101010101010101 in memory region [low-before, high+after]. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5113 |
// Val, addr are temp registers. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5114 |
// If low == addr, addr is killed. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5115 |
// High is preserved. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5116 |
void MacroAssembler::zap_from_to(Register low, int before, Register high, int after, Register val, Register addr) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5117 |
if (!ZapMemory) return; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5118 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5119 |
assert_different_registers(low, val); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5120 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5121 |
BLOCK_COMMENT("zap memory region {"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5122 |
load_const_optimized(val, 0x0101010101010101); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5123 |
int size = before + after; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5124 |
if (low == high && size < 5 && size > 0) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5125 |
int offset = -before*BytesPerWord; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5126 |
for (int i = 0; i < size; ++i) { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5127 |
std(val, offset, low); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5128 |
offset += (1*BytesPerWord); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5129 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5130 |
} else { |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5131 |
addi(addr, low, -before*BytesPerWord); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5132 |
assert_different_registers(high, val); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5133 |
if (after) addi(high, high, after * BytesPerWord); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5134 |
Label loop; |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5135 |
bind(loop); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5136 |
std(val, 0, addr); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5137 |
addi(addr, addr, 8); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5138 |
cmpd(CCR6, addr, high); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5139 |
ble(CCR6, loop); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5140 |
if (after) addi(high, high, -after * BytesPerWord); // Correct back to old value. |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5141 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5142 |
BLOCK_COMMENT("} zap memory region"); |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5143 |
} |
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5144 |
|
28258dd5cb2e
8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff
changeset
|
5145 |
#endif // !PRODUCT |
23221 | 5146 |
|
48476 | 5147 |
// Emits code that loads the byte-sized bool at flag_addr and branches to
// 'label' when it is zero.
// Kills: temp, R0 (temp for the address load), CCR0.
void SkipIfEqualZero::skip_to_label_if_equal_zero(MacroAssembler* masm, Register temp,
                                                  const bool* flag_addr, Label& label) {
  // The flag is read with a single byte load below.
  assert(sizeof(bool) == 1, "PowerPC ABI");

  // Materialize the flag address; the returned 16-bit remainder is applied as
  // the displacement of the load.
  const int flag_disp = masm->load_const_optimized(temp, (address)flag_addr, R0, true);
  masm->lbz(temp, flag_disp, temp);
  masm->cmpwi(CCR0, temp, 0);
  masm->beq(CCR0, label);
}
|
5155 |
||
5156 |
// Starts a skippable code region: emits the flag test and a forward branch to
// the internal label, which the destructor binds.
SkipIfEqualZero::SkipIfEqualZero(MacroAssembler* masm, Register temp, const bool* flag_addr)
  : _masm(masm),
    _label() {
  skip_to_label_if_equal_zero(masm, temp, flag_addr, _label);
}
5159 |
||
5160 |
// Ends the skippable region by binding the label that the constructor's
// branch targets.
SkipIfEqualZero::~SkipIfEqualZero() {
  MacroAssembler* const masm = _masm;
  masm->bind(_label);
}