author | prr |
Wed, 15 Apr 2015 14:28:43 -0700 | |
changeset 30465 | a77083748efc |
parent 26579 | 522d6486f410 |
child 30217 | 5eb8768d86c4 |
permissions | -rw-r--r-- |
1 | 1 |
/* |
24953
9680119572be
8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents:
22554
diff
changeset
|
2 |
* Copyright (c) 1997, 2014, Oracle and/or its affiliates. All rights reserved. |
1 | 3 |
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
4 |
* |
|
5 |
* This code is free software; you can redistribute it and/or modify it |
|
6 |
* under the terms of the GNU General Public License version 2 only, as |
|
7 |
* published by the Free Software Foundation. |
|
8 |
* |
|
9 |
* This code is distributed in the hope that it will be useful, but WITHOUT |
|
10 |
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
|
11 |
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
|
12 |
* version 2 for more details (a copy is included in the LICENSE file that |
|
13 |
* accompanied this code). |
|
14 |
* |
|
15 |
* You should have received a copy of the GNU General Public License version |
|
16 |
* 2 along with this work; if not, write to the Free Software Foundation, |
|
17 |
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
|
18 |
* |
|
5547
f4b087cbb361
6941466: Oracle rebranding changes for Hotspot repositories
trims
parents:
2255
diff
changeset
|
19 |
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
f4b087cbb361
6941466: Oracle rebranding changes for Hotspot repositories
trims
parents:
2255
diff
changeset
|
20 |
* or visit www.oracle.com if you need additional information or have any |
f4b087cbb361
6941466: Oracle rebranding changes for Hotspot repositories
trims
parents:
2255
diff
changeset
|
21 |
* questions. |
1 | 22 |
* |
23 |
*/ |
|
24 |
||
7397 | 25 |
#ifndef CPU_SPARC_VM_VM_VERSION_SPARC_HPP |
26 |
#define CPU_SPARC_VM_VM_VERSION_SPARC_HPP |
|
27 |
||
28 |
#include "runtime/globals_extension.hpp" |
|
29 |
#include "runtime/vm_version.hpp" |
|
30 |
||
1 | 31 |
class VM_Version: public Abstract_VM_Version { |
32 |
protected: |
|
33 |
enum Feature_Flag { |
|
10252 | 34 |
v8_instructions = 0, |
35 |
hardware_mul32 = 1, |
|
36 |
hardware_div32 = 2, |
|
37 |
hardware_fsmuld = 3, |
|
38 |
hardware_popc = 4, |
|
39 |
v9_instructions = 5, |
|
40 |
vis1_instructions = 6, |
|
41 |
vis2_instructions = 7, |
|
42 |
sun4v_instructions = 8, |
|
7115
32300e243300
6987135: Performance regression on Intel platform with 32-bits edition between 6u13 and 6u14.
kvn
parents:
5547
diff
changeset
|
43 |
blk_init_instructions = 9, |
10252 | 44 |
fmaf_instructions = 10, |
45 |
fmau_instructions = 11, |
|
46 |
vis3_instructions = 12, |
|
13394 | 47 |
cbcond_instructions = 13, |
48 |
sparc64_family = 14, |
|
49 |
M_family = 15, |
|
50 |
T_family = 16, |
|
22505 | 51 |
T1_model = 17, |
22554
a19b9cf9ffa8
8031290: Adjust call to getisax() for additional words returned
jmasa
parents:
22505
diff
changeset
|
52 |
sparc5_instructions = 18, |
24953
9680119572be
8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents:
22554
diff
changeset
|
53 |
aes_instructions = 19, |
9680119572be
8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents:
22554
diff
changeset
|
54 |
sha1_instruction = 20, |
9680119572be
8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents:
22554
diff
changeset
|
55 |
sha256_instruction = 21, |
9680119572be
8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents:
22554
diff
changeset
|
56 |
sha512_instruction = 22 |
1 | 57 |
}; |
58 |
||
59 |
enum Feature_Flag_Set { |
|
2253
30268d00878e
6812587: Use auxv to determine SPARC hardware features on Solaris
twisti
parents:
670
diff
changeset
|
60 |
unknown_m = 0, |
30268d00878e
6812587: Use auxv to determine SPARC hardware features on Solaris
twisti
parents:
670
diff
changeset
|
61 |
all_features_m = -1, |
1 | 62 |
|
10252 | 63 |
v8_instructions_m = 1 << v8_instructions, |
64 |
hardware_mul32_m = 1 << hardware_mul32, |
|
65 |
hardware_div32_m = 1 << hardware_div32, |
|
66 |
hardware_fsmuld_m = 1 << hardware_fsmuld, |
|
67 |
hardware_popc_m = 1 << hardware_popc, |
|
68 |
v9_instructions_m = 1 << v9_instructions, |
|
69 |
vis1_instructions_m = 1 << vis1_instructions, |
|
70 |
vis2_instructions_m = 1 << vis2_instructions, |
|
71 |
sun4v_m = 1 << sun4v_instructions, |
|
7115
32300e243300
6987135: Performance regression on Intel platform with 32-bits edition between 6u13 and 6u14.
kvn
parents:
5547
diff
changeset
|
72 |
blk_init_instructions_m = 1 << blk_init_instructions, |
10252 | 73 |
fmaf_instructions_m = 1 << fmaf_instructions, |
74 |
fmau_instructions_m = 1 << fmau_instructions, |
|
75 |
vis3_instructions_m = 1 << vis3_instructions, |
|
13394 | 76 |
cbcond_instructions_m = 1 << cbcond_instructions, |
10252 | 77 |
sparc64_family_m = 1 << sparc64_family, |
13394 | 78 |
M_family_m = 1 << M_family, |
10252 | 79 |
T_family_m = 1 << T_family, |
80 |
T1_model_m = 1 << T1_model, |
|
22554
a19b9cf9ffa8
8031290: Adjust call to getisax() for additional words returned
jmasa
parents:
22505
diff
changeset
|
81 |
sparc5_instructions_m = 1 << sparc5_instructions, |
22505 | 82 |
aes_instructions_m = 1 << aes_instructions, |
24953
9680119572be
8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents:
22554
diff
changeset
|
83 |
sha1_instruction_m = 1 << sha1_instruction, |
9680119572be
8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents:
22554
diff
changeset
|
84 |
sha256_instruction_m = 1 << sha256_instruction, |
9680119572be
8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents:
22554
diff
changeset
|
85 |
sha512_instruction_m = 1 << sha512_instruction, |
1 | 86 |
|
2253
30268d00878e
6812587: Use auxv to determine SPARC hardware features on Solaris
twisti
parents:
670
diff
changeset
|
87 |
generic_v8_m = v8_instructions_m | hardware_mul32_m | hardware_div32_m | hardware_fsmuld_m, |
30268d00878e
6812587: Use auxv to determine SPARC hardware features on Solaris
twisti
parents:
670
diff
changeset
|
88 |
generic_v9_m = generic_v8_m | v9_instructions_m, |
30268d00878e
6812587: Use auxv to determine SPARC hardware features on Solaris
twisti
parents:
670
diff
changeset
|
89 |
ultra3_m = generic_v9_m | vis1_instructions_m | vis2_instructions_m, |
1 | 90 |
|
91 |
// Temporary until we have something more accurate |
|
2253
30268d00878e
6812587: Use auxv to determine SPARC hardware features on Solaris
twisti
parents:
670
diff
changeset
|
92 |
niagara1_unique_m = sun4v_m, |
30268d00878e
6812587: Use auxv to determine SPARC hardware features on Solaris
twisti
parents:
670
diff
changeset
|
93 |
niagara1_m = generic_v9_m | niagara1_unique_m |
1 | 94 |
}; |
95 |
||
96 |
static int _features; |
|
97 |
static const char* _features_str; |
|
98 |
||
26579
522d6486f410
8056124: Hotspot should use PICL interface to get cacheline size on SPARC
iveresov
parents:
24953
diff
changeset
|
99 |
static unsigned int _L2_cache_line_size; |
522d6486f410
8056124: Hotspot should use PICL interface to get cacheline size on SPARC
iveresov
parents:
24953
diff
changeset
|
100 |
static unsigned int L2_cache_line_size() { return _L2_cache_line_size; } |
522d6486f410
8056124: Hotspot should use PICL interface to get cacheline size on SPARC
iveresov
parents:
24953
diff
changeset
|
101 |
|
1 | 102 |
static void print_features(); |
103 |
static int determine_features(); |
|
104 |
static int platform_features(int features); |
|
105 |
||
7704 | 106 |
// Returns true if the platform is in the niagara line (T series) |
13394 | 107 |
static bool is_M_family(int features) { return (features & M_family_m) != 0; } |
7704 | 108 |
static bool is_T_family(int features) { return (features & T_family_m) != 0; } |
109 |
static bool is_niagara() { return is_T_family(_features); } |
|
21922
3c90a49d87a3
8029190: VM_Version::determine_features() asserts on Fujitsu Sparc64 CPUs
simonis
parents:
18097
diff
changeset
|
110 |
#ifdef ASSERT |
3c90a49d87a3
8029190: VM_Version::determine_features() asserts on Fujitsu Sparc64 CPUs
simonis
parents:
18097
diff
changeset
|
111 |
static bool is_niagara(int features) { |
3c90a49d87a3
8029190: VM_Version::determine_features() asserts on Fujitsu Sparc64 CPUs
simonis
parents:
18097
diff
changeset
|
112 |
// 'sun4v_m' may be defined on both Sun/Oracle Sparc CPUs as well as |
3c90a49d87a3
8029190: VM_Version::determine_features() asserts on Fujitsu Sparc64 CPUs
simonis
parents:
18097
diff
changeset
|
113 |
// on Fujitsu Sparc64 CPUs, but only Sun/Oracle Sparcs can be 'niagaras'. |
3c90a49d87a3
8029190: VM_Version::determine_features() asserts on Fujitsu Sparc64 CPUs
simonis
parents:
18097
diff
changeset
|
114 |
return (features & sun4v_m) != 0 && (features & sparc64_family_m) == 0; |
3c90a49d87a3
8029190: VM_Version::determine_features() asserts on Fujitsu Sparc64 CPUs
simonis
parents:
18097
diff
changeset
|
115 |
} |
3c90a49d87a3
8029190: VM_Version::determine_features() asserts on Fujitsu Sparc64 CPUs
simonis
parents:
18097
diff
changeset
|
116 |
#endif |
7704 | 117 |
|
118 |
// Returns true if it is niagara1 (T1). |
|
119 |
static bool is_T1_model(int features) { return is_T_family(features) && ((features & T1_model_m) != 0); } |
|
1 | 120 |
|
183
ba55c7f3fd45
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
1
diff
changeset
|
121 |
static int maximum_niagara1_processor_count() { return 32; } |
ba55c7f3fd45
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
1
diff
changeset
|
122 |
|
1 | 123 |
public: |
124 |
// Initialization |
|
125 |
static void initialize(); |
|
126 |
||
127 |
// Instruction support |
|
128 |
static bool has_v8() { return (_features & v8_instructions_m) != 0; } |
|
129 |
static bool has_v9() { return (_features & v9_instructions_m) != 0; } |
|
2253
30268d00878e
6812587: Use auxv to determine SPARC hardware features on Solaris
twisti
parents:
670
diff
changeset
|
130 |
static bool has_hardware_mul32() { return (_features & hardware_mul32_m) != 0; } |
30268d00878e
6812587: Use auxv to determine SPARC hardware features on Solaris
twisti
parents:
670
diff
changeset
|
131 |
static bool has_hardware_div32() { return (_features & hardware_div32_m) != 0; } |
1 | 132 |
static bool has_hardware_fsmuld() { return (_features & hardware_fsmuld_m) != 0; } |
2255
54abdf3e1055
6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents:
2253
diff
changeset
|
133 |
static bool has_hardware_popc() { return (_features & hardware_popc_m) != 0; } |
1 | 134 |
static bool has_vis1() { return (_features & vis1_instructions_m) != 0; } |
135 |
static bool has_vis2() { return (_features & vis2_instructions_m) != 0; } |
|
7704 | 136 |
static bool has_vis3() { return (_features & vis3_instructions_m) != 0; } |
7115
32300e243300
6987135: Performance regression on Intel platform with 32-bits edition between 6u13 and 6u14.
kvn
parents:
5547
diff
changeset
|
137 |
static bool has_blk_init() { return (_features & blk_init_instructions_m) != 0; } |
10252 | 138 |
static bool has_cbcond() { return (_features & cbcond_instructions_m) != 0; } |
22554
a19b9cf9ffa8
8031290: Adjust call to getisax() for additional words returned
jmasa
parents:
22505
diff
changeset
|
139 |
static bool has_sparc5_instr() { return (_features & sparc5_instructions_m) != 0; } |
22505 | 140 |
static bool has_aes() { return (_features & aes_instructions_m) != 0; } |
24953
9680119572be
8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents:
22554
diff
changeset
|
141 |
static bool has_sha1() { return (_features & sha1_instruction_m) != 0; } |
9680119572be
8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents:
22554
diff
changeset
|
142 |
static bool has_sha256() { return (_features & sha256_instruction_m) != 0; } |
9680119572be
8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents:
22554
diff
changeset
|
143 |
static bool has_sha512() { return (_features & sha512_instruction_m) != 0; } |
1 | 144 |
|
145 |
static bool supports_compare_and_exchange() |
|
146 |
{ return has_v9(); } |
|
147 |
||
7704 | 148 |
// Returns true if the platform is in the niagara line (T series) |
149 |
// and newer than the niagara1. |
|
150 |
static bool is_niagara_plus() { return is_T_family(_features) && !is_T1_model(_features); } |
|
13888
93dce24e57e5
7188176: The JVM should differentiate between T and M series and adjust GC ergonomics
twisti
parents:
13394
diff
changeset
|
151 |
|
93dce24e57e5
7188176: The JVM should differentiate between T and M series and adjust GC ergonomics
twisti
parents:
13394
diff
changeset
|
152 |
static bool is_M_series() { return is_M_family(_features); } |
10267 | 153 |
static bool is_T4() { return is_T_family(_features) && has_cbcond(); } |
22554
a19b9cf9ffa8
8031290: Adjust call to getisax() for additional words returned
jmasa
parents:
22505
diff
changeset
|
154 |
static bool is_T7() { return is_T_family(_features) && has_sparc5_instr(); } |
10252 | 155 |
|
7704 | 156 |
// Fujitsu SPARC64 |
157 |
static bool is_sparc64() { return (_features & sparc64_family_m) != 0; } |
|
1 | 158 |
|
10252 | 159 |
static bool is_sun4v() { return (_features & sun4v_m) != 0; } |
160 |
static bool is_ultra3() { return (_features & ultra3_m) == ultra3_m && !is_sun4v() && !is_sparc64(); } |
|
161 |
||
7704 | 162 |
static bool has_fast_fxtof() { return is_niagara() || is_sparc64() || has_v9() && !is_ultra3(); } |
163 |
static bool has_fast_idiv() { return is_niagara_plus() || is_sparc64(); } |
|
10267 | 164 |
|
10252 | 165 |
// T4 and newer Sparc have fast RDPC instruction. |
10267 | 166 |
static bool has_fast_rdpc() { return is_T4(); } |
167 |
||
10501 | 168 |
// On T4 and newer Sparc BIS to the beginning of cache line always zeros it. |
169 |
static bool has_block_zeroing() { return has_blk_init() && is_T4(); } |
|
1 | 170 |
|
171 |
static const char* cpu_features() { return _features_str; } |
|
172 |
||
26579
522d6486f410
8056124: Hotspot should use PICL interface to get cacheline size on SPARC
iveresov
parents:
24953
diff
changeset
|
173 |
// default prefetch block size on sparc |
522d6486f410
8056124: Hotspot should use PICL interface to get cacheline size on SPARC
iveresov
parents:
24953
diff
changeset
|
174 |
static intx prefetch_data_size() { return L2_cache_line_size(); } |
1 | 175 |
|
176 |
// Prefetch |
|
177 |
static intx prefetch_copy_interval_in_bytes() { |
|
178 |
intx interval = PrefetchCopyIntervalInBytes; |
|
179 |
return interval >= 0 ? interval : (has_v9() ? 512 : 0); |
|
180 |
} |
|
181 |
static intx prefetch_scan_interval_in_bytes() { |
|
182 |
intx interval = PrefetchScanIntervalInBytes; |
|
183 |
return interval >= 0 ? interval : (has_v9() ? 512 : 0); |
|
184 |
} |
|
185 |
static intx prefetch_fields_ahead() { |
|
186 |
intx count = PrefetchFieldsAhead; |
|
187 |
return count >= 0 ? count : (is_ultra3() ? 1 : 0); |
|
188 |
} |
|
189 |
||
190 |
static intx allocate_prefetch_distance() { |
|
191 |
// This method should be called before allocate_prefetch_style(). |
|
192 |
intx count = AllocatePrefetchDistance; |
|
193 |
if (count < 0) { // default is not defined ? |
|
194 |
count = 512; |
|
195 |
} |
|
196 |
return count; |
|
197 |
} |
|
198 |
static intx allocate_prefetch_style() { |
|
199 |
assert(AllocatePrefetchStyle >= 0, "AllocatePrefetchStyle should be positive"); |
|
200 |
// Return 0 if AllocatePrefetchDistance was not defined. |
|
201 |
return AllocatePrefetchDistance > 0 ? AllocatePrefetchStyle : 0; |
|
202 |
} |
|
203 |
||
204 |
// Assembler testing |
|
205 |
static void allow_all(); |
|
206 |
static void revert(); |
|
207 |
||
208 |
// Override the Abstract_VM_Version implementation. |
|
209 |
static uint page_size_count() { return is_sun4v() ? 4 : 2; } |
|
183
ba55c7f3fd45
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
1
diff
changeset
|
210 |
|
ba55c7f3fd45
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
1
diff
changeset
|
211 |
// Calculates the number of parallel threads |
ba55c7f3fd45
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
1
diff
changeset
|
212 |
static unsigned int calc_parallel_worker_threads(); |
1 | 213 |
}; |
7397 | 214 |
|
215 |
#endif // CPU_SPARC_VM_VM_VERSION_SPARC_HPP |