33066
|
1 |
/*
|
54249
|
2 |
* Copyright (c) 2015, 2019, Oracle and/or its affiliates. All rights reserved.
|
33066
|
3 |
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
|
|
4 |
*
|
|
5 |
* This code is free software; you can redistribute it and/or modify it
|
|
6 |
* under the terms of the GNU General Public License version 2 only, as
|
|
7 |
* published by the Free Software Foundation.
|
|
8 |
*
|
|
9 |
* This code is distributed in the hope that it will be useful, but WITHOUT
|
|
10 |
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
11 |
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
12 |
* version 2 for more details (a copy is included in the LICENSE file that
|
|
13 |
* accompanied this code).
|
|
14 |
*
|
|
15 |
* You should have received a copy of the GNU General Public License version
|
|
16 |
* 2 along with this work; if not, write to the Free Software Foundation,
|
|
17 |
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
18 |
*
|
|
19 |
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
|
|
20 |
* or visit www.oracle.com if you need additional information or have any
|
|
21 |
* questions.
|
|
22 |
*
|
|
23 |
*/
|
|
24 |
|
54249
|
25 |
#ifndef CPU_X86_CRC32C_H
|
|
26 |
#define CPU_X86_CRC32C_H
|
|
27 |
|
33066
|
28 |
enum {
|
|
29 |
// S. Gueron / Information Processing Letters 112 (2012) 184
|
|
30 |
// shows than anything above 6K and below 32K is a good choice
|
|
31 |
// 32K does not deliver any further performance gains
|
|
32 |
// 6K=8*256 (*3 as we compute 3 blocks together)
|
|
33 |
//
|
|
34 |
// Thus selecting the smallest value so it could apply to the largest number
|
|
35 |
// of buffer sizes.
|
|
36 |
CRC32C_HIGH = 8 * 256,
|
|
37 |
|
|
38 |
// empirical
|
|
39 |
// based on ubench study using methodology described in
|
|
40 |
// V. Gopal et al. / Fast CRC Computation for iSCSI Polynomial Using CRC32 Instruction April 2011 8
|
|
41 |
//
|
|
42 |
// arbitrary value between 27 and 256
|
|
43 |
CRC32C_MIDDLE = 8 * 86,
|
|
44 |
|
|
45 |
// V. Gopal et al. / Fast CRC Computation for iSCSI Polynomial Using CRC32 Instruction April 2011 9
|
|
46 |
// shows that 240 and 1024 are equally good choices as the 216==8*27
|
|
47 |
//
|
|
48 |
// Selecting the smallest value which resulted in a significant performance improvement over
|
|
49 |
// sequential version
|
|
50 |
CRC32C_LOW = 8 * 27,
|
|
51 |
|
|
52 |
CRC32C_NUM_ChunkSizeInBytes = 3,
|
|
53 |
|
|
54 |
// We need to compute powers of 64N and 128N for each "chunk" size
|
|
55 |
CRC32C_NUM_PRECOMPUTED_CONSTANTS = ( 2 * CRC32C_NUM_ChunkSizeInBytes )
|
|
56 |
};
|
|
57 |
// Notes:
|
|
58 |
// 1. Why we need to choose a "chunk" approach?
|
|
59 |
// Overhead of computing a powers and powers of for an arbitrary buffer of size N is significant
|
|
60 |
// (implementation approaches a library perf.)
|
|
61 |
// 2. Why only 3 "chunks"?
|
|
62 |
// Performance experiments results showed that a HIGH+LOW was not delivering a stable speedup
|
|
63 |
// curve.
|
|
64 |
//
|
|
65 |
// Disclaimer:
|
|
66 |
// If you ever decide to increase/decrease number of "chunks" be sure to modify
|
|
67 |
// a) constants table generation (hotspot/src/cpu/x86/vm/stubRoutines_x86.cpp)
|
|
68 |
// b) constant fetch from that table (macroAssembler_x86.cpp)
|
|
69 |
// c) unrolled for loop (macroAssembler_x86.cpp)
|
54249
|
70 |
|
|
71 |
#endif /* !CPU_X86_CRC32C_H */
|