1 /* 2 * Copyright (c) 2013, 2021, Oracle and/or its affiliates. All rights reserved. 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 4 * 5 * This code is free software; you can redistribute it and/or modify it 6 * under the terms of the GNU General Public License version 2 only, as 7 * published by the Free Software Foundation. 8 * 9 * This code is distributed in the hope that it will be useful, but WITHOUT 10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License 12 * version 2 for more details (a copy is included in the LICENSE file that 13 * accompanied this code). 14 * 15 * You should have received a copy of the GNU General Public License version 16 * 2 along with this work; if not, write to the Free Software Foundation, 17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. 18 * 19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA 20 * or visit www.oracle.com if you need additional information or have any 21 * questions. 22 * 23 */ 24 25 #include "precompiled.hpp" 26 #include "runtime/deoptimization.hpp" 27 #include "runtime/frame.inline.hpp" 28 #include "runtime/stubRoutines.hpp" 29 #include "runtime/thread.inline.hpp" 30 #include "utilities/globalDefinitions.hpp" 31 #include "crc32c.h" 32 33 // Implementation of the platform-specific part of StubRoutines - for 34 // a description of how to extend it, see the stubRoutines.hpp file. 35 36 address StubRoutines::x86::_verify_mxcsr_entry = NULL; 37 address StubRoutines::x86::_key_shuffle_mask_addr = NULL; 38 address StubRoutines::x86::_counter_shuffle_mask_addr = NULL; 39 address StubRoutines::x86::_ghash_long_swap_mask_addr = NULL; 40 address StubRoutines::x86::_ghash_byte_swap_mask_addr = NULL; 41 address StubRoutines::x86::_ghash_poly_addr = NULL; 42 address StubRoutines::x86::_ghash_shuffmask_addr = NULL; 43 address StubRoutines::x86::_upper_word_mask_addr = NULL; 44 address StubRoutines::x86::_shuffle_byte_flip_mask_addr = NULL; 45 address StubRoutines::x86::_k256_adr = NULL; 46 address StubRoutines::x86::_vector_short_to_byte_mask = NULL; 47 address StubRoutines::x86::_vector_int_to_byte_mask = NULL; 48 address StubRoutines::x86::_vector_int_to_short_mask = NULL; 49 address StubRoutines::x86::_vector_all_bits_set = NULL; 50 address StubRoutines::x86::_vector_byte_shuffle_mask = NULL; 51 address StubRoutines::x86::_vector_short_shuffle_mask = NULL; 52 address StubRoutines::x86::_vector_int_shuffle_mask = NULL; 53 address StubRoutines::x86::_vector_long_shuffle_mask = NULL; 54 address StubRoutines::x86::_vector_float_sign_mask = NULL; 55 address StubRoutines::x86::_vector_float_sign_flip = NULL; 56 address StubRoutines::x86::_vector_double_sign_mask = NULL; 57 address StubRoutines::x86::_vector_double_sign_flip = NULL; 58 address StubRoutines::x86::_vector_byte_perm_mask = NULL; 59 address StubRoutines::x86::_vector_long_sign_mask = NULL; 60 address StubRoutines::x86::_vector_iota_indices = NULL; 61 address StubRoutines::x86::_vector_32_bit_mask = NULL; 62 address StubRoutines::x86::_vector_64_bit_mask = NULL; 63 #ifdef _LP64 64 address StubRoutines::x86::_k256_W_adr = NULL; 65 address StubRoutines::x86::_k512_W_addr = NULL; 66 address StubRoutines::x86::_pshuffle_byte_flip_mask_addr_sha512 = NULL; 67 // Base64 masks 68 address StubRoutines::x86::_encoding_table_base64 = NULL; 69 address StubRoutines::x86::_shuffle_base64 = NULL; 70 address StubRoutines::x86::_avx2_shuffle_base64 = NULL; 71 address StubRoutines::x86::_avx2_input_mask_base64 = NULL; 72 address StubRoutines::x86::_avx2_lut_base64 = NULL; 73 address StubRoutines::x86::_counter_mask_addr = NULL; 74 address StubRoutines::x86::_lookup_lo_base64 = NULL; 75 address StubRoutines::x86::_lookup_hi_base64 = NULL; 76 address StubRoutines::x86::_lookup_lo_base64url = NULL; 77 address StubRoutines::x86::_lookup_hi_base64url = NULL; 78 address StubRoutines::x86::_pack_vec_base64 = NULL; 79 address StubRoutines::x86::_join_0_1_base64 = NULL; 80 address StubRoutines::x86::_join_1_2_base64 = NULL; 81 address StubRoutines::x86::_join_2_3_base64 = NULL; 82 address StubRoutines::x86::_decoding_table_base64 = NULL; 83 #endif 84 address StubRoutines::x86::_pshuffle_byte_flip_mask_addr = NULL; 85 address StubRoutines::x86::_check_lock_stack = NULL; 86 87 //tables common for sin and cos 88 address StubRoutines::x86::_ONEHALF_adr = NULL; 89 address StubRoutines::x86::_P_2_adr = NULL; 90 address StubRoutines::x86::_SC_4_adr = NULL; 91 address StubRoutines::x86::_Ctable_adr = NULL; 92 address StubRoutines::x86::_SC_2_adr = NULL; 93 address StubRoutines::x86::_SC_3_adr = NULL; 94 address StubRoutines::x86::_SC_1_adr = NULL; 95 address StubRoutines::x86::_PI_INV_TABLE_adr = NULL; 96 address StubRoutines::x86::_PI_4_adr = NULL; 97 address StubRoutines::x86::_PI32INV_adr = NULL; 98 address StubRoutines::x86::_SIGN_MASK_adr = NULL; 99 address StubRoutines::x86::_P_1_adr = NULL; 100 address StubRoutines::x86::_P_3_adr = NULL; 101 address StubRoutines::x86::_NEG_ZERO_adr = NULL; 102 103 //tables common for sincos and tancot 104 address StubRoutines::x86::_L_2il0floatpacket_0_adr = NULL; 105 address StubRoutines::x86::_Pi4Inv_adr = NULL; 106 address StubRoutines::x86::_Pi4x3_adr = NULL; 107 address StubRoutines::x86::_Pi4x4_adr = NULL; 108 address StubRoutines::x86::_ones_adr = NULL; 109 110 uint64_t StubRoutines::x86::_crc_by128_masks[] = 111 { 112 /* The fields in this structure are arranged so that they can be 113 * picked up two at a time with 128-bit loads. 114 * 115 * Because of flipped bit order for this CRC polynomials 116 * the constant for X**N is left-shifted by 1. This is because 117 * a 64 x 64 polynomial multiply produces a 127-bit result 118 * but the highest term is always aligned to bit 0 in the container. 119 * Pre-shifting by one fixes this, at the cost of potentially making 120 * the 32-bit constant no longer fit in a 32-bit container (thus the 121 * use of uint64_t, though this is also the size used by the carry- 122 * less multiply instruction. 123 * 124 * In addition, the flipped bit order and highest-term-at-least-bit 125 * multiply changes the constants used. The 96-bit result will be 126 * aligned to the high-term end of the target 128-bit container, 127 * not the low-term end; that is, instead of a 512-bit or 576-bit fold, 128 * instead it is a 480 (=512-32) or 544 (=512+64-32) bit fold. 129 * 130 * This cause additional problems in the 128-to-64-bit reduction; see the 131 * code for details. By storing a mask in the otherwise unused half of 132 * a 128-bit constant, bits can be cleared before multiplication without 133 * storing and reloading. Note that staying on a 128-bit datapath means 134 * that some data is uselessly stored and some unused data is intersected 135 * with an irrelevant constant. 136 */ 137 138 ((uint64_t) 0xffffffffUL), /* low of K_M_64 */ 139 ((uint64_t) 0xb1e6b092U << 1), /* high of K_M_64 */ 140 ((uint64_t) 0xba8ccbe8U << 1), /* low of K_160_96 */ 141 ((uint64_t) 0x6655004fU << 1), /* high of K_160_96 */ 142 ((uint64_t) 0xaa2215eaU << 1), /* low of K_544_480 */ 143 ((uint64_t) 0xe3720acbU << 1) /* high of K_544_480 */ 144 }; 145 146 /** 147 * crc_table[] from jdk/src/share/native/java/util/zip/zlib-1.2.5/crc32.h 148 */ 149 juint StubRoutines::x86::_crc_table[] = 150 { 151 0x00000000UL, 0x77073096UL, 0xee0e612cUL, 0x990951baUL, 0x076dc419UL, 152 0x706af48fUL, 0xe963a535UL, 0x9e6495a3UL, 0x0edb8832UL, 0x79dcb8a4UL, 153 0xe0d5e91eUL, 0x97d2d988UL, 0x09b64c2bUL, 0x7eb17cbdUL, 0xe7b82d07UL, 154 0x90bf1d91UL, 0x1db71064UL, 0x6ab020f2UL, 0xf3b97148UL, 0x84be41deUL, 155 0x1adad47dUL, 0x6ddde4ebUL, 0xf4d4b551UL, 0x83d385c7UL, 0x136c9856UL, 156 0x646ba8c0UL, 0xfd62f97aUL, 0x8a65c9ecUL, 0x14015c4fUL, 0x63066cd9UL, 157 0xfa0f3d63UL, 0x8d080df5UL, 0x3b6e20c8UL, 0x4c69105eUL, 0xd56041e4UL, 158 0xa2677172UL, 0x3c03e4d1UL, 0x4b04d447UL, 0xd20d85fdUL, 0xa50ab56bUL, 159 0x35b5a8faUL, 0x42b2986cUL, 0xdbbbc9d6UL, 0xacbcf940UL, 0x32d86ce3UL, 160 0x45df5c75UL, 0xdcd60dcfUL, 0xabd13d59UL, 0x26d930acUL, 0x51de003aUL, 161 0xc8d75180UL, 0xbfd06116UL, 0x21b4f4b5UL, 0x56b3c423UL, 0xcfba9599UL, 162 0xb8bda50fUL, 0x2802b89eUL, 0x5f058808UL, 0xc60cd9b2UL, 0xb10be924UL, 163 0x2f6f7c87UL, 0x58684c11UL, 0xc1611dabUL, 0xb6662d3dUL, 0x76dc4190UL, 164 0x01db7106UL, 0x98d220bcUL, 0xefd5102aUL, 0x71b18589UL, 0x06b6b51fUL, 165 0x9fbfe4a5UL, 0xe8b8d433UL, 0x7807c9a2UL, 0x0f00f934UL, 0x9609a88eUL, 166 0xe10e9818UL, 0x7f6a0dbbUL, 0x086d3d2dUL, 0x91646c97UL, 0xe6635c01UL, 167 0x6b6b51f4UL, 0x1c6c6162UL, 0x856530d8UL, 0xf262004eUL, 0x6c0695edUL, 168 0x1b01a57bUL, 0x8208f4c1UL, 0xf50fc457UL, 0x65b0d9c6UL, 0x12b7e950UL, 169 0x8bbeb8eaUL, 0xfcb9887cUL, 0x62dd1ddfUL, 0x15da2d49UL, 0x8cd37cf3UL, 170 0xfbd44c65UL, 0x4db26158UL, 0x3ab551ceUL, 0xa3bc0074UL, 0xd4bb30e2UL, 171 0x4adfa541UL, 0x3dd895d7UL, 0xa4d1c46dUL, 0xd3d6f4fbUL, 0x4369e96aUL, 172 0x346ed9fcUL, 0xad678846UL, 0xda60b8d0UL, 0x44042d73UL, 0x33031de5UL, 173 0xaa0a4c5fUL, 0xdd0d7cc9UL, 0x5005713cUL, 0x270241aaUL, 0xbe0b1010UL, 174 0xc90c2086UL, 0x5768b525UL, 0x206f85b3UL, 0xb966d409UL, 0xce61e49fUL, 175 0x5edef90eUL, 0x29d9c998UL, 0xb0d09822UL, 0xc7d7a8b4UL, 0x59b33d17UL, 176 0x2eb40d81UL, 0xb7bd5c3bUL, 0xc0ba6cadUL, 0xedb88320UL, 0x9abfb3b6UL, 177 0x03b6e20cUL, 0x74b1d29aUL, 0xead54739UL, 0x9dd277afUL, 0x04db2615UL, 178 0x73dc1683UL, 0xe3630b12UL, 0x94643b84UL, 0x0d6d6a3eUL, 0x7a6a5aa8UL, 179 0xe40ecf0bUL, 0x9309ff9dUL, 0x0a00ae27UL, 0x7d079eb1UL, 0xf00f9344UL, 180 0x8708a3d2UL, 0x1e01f268UL, 0x6906c2feUL, 0xf762575dUL, 0x806567cbUL, 181 0x196c3671UL, 0x6e6b06e7UL, 0xfed41b76UL, 0x89d32be0UL, 0x10da7a5aUL, 182 0x67dd4accUL, 0xf9b9df6fUL, 0x8ebeeff9UL, 0x17b7be43UL, 0x60b08ed5UL, 183 0xd6d6a3e8UL, 0xa1d1937eUL, 0x38d8c2c4UL, 0x4fdff252UL, 0xd1bb67f1UL, 184 0xa6bc5767UL, 0x3fb506ddUL, 0x48b2364bUL, 0xd80d2bdaUL, 0xaf0a1b4cUL, 185 0x36034af6UL, 0x41047a60UL, 0xdf60efc3UL, 0xa867df55UL, 0x316e8eefUL, 186 0x4669be79UL, 0xcb61b38cUL, 0xbc66831aUL, 0x256fd2a0UL, 0x5268e236UL, 187 0xcc0c7795UL, 0xbb0b4703UL, 0x220216b9UL, 0x5505262fUL, 0xc5ba3bbeUL, 188 0xb2bd0b28UL, 0x2bb45a92UL, 0x5cb36a04UL, 0xc2d7ffa7UL, 0xb5d0cf31UL, 189 0x2cd99e8bUL, 0x5bdeae1dUL, 0x9b64c2b0UL, 0xec63f226UL, 0x756aa39cUL, 190 0x026d930aUL, 0x9c0906a9UL, 0xeb0e363fUL, 0x72076785UL, 0x05005713UL, 191 0x95bf4a82UL, 0xe2b87a14UL, 0x7bb12baeUL, 0x0cb61b38UL, 0x92d28e9bUL, 192 0xe5d5be0dUL, 0x7cdcefb7UL, 0x0bdbdf21UL, 0x86d3d2d4UL, 0xf1d4e242UL, 193 0x68ddb3f8UL, 0x1fda836eUL, 0x81be16cdUL, 0xf6b9265bUL, 0x6fb077e1UL, 194 0x18b74777UL, 0x88085ae6UL, 0xff0f6a70UL, 0x66063bcaUL, 0x11010b5cUL, 195 0x8f659effUL, 0xf862ae69UL, 0x616bffd3UL, 0x166ccf45UL, 0xa00ae278UL, 196 0xd70dd2eeUL, 0x4e048354UL, 0x3903b3c2UL, 0xa7672661UL, 0xd06016f7UL, 197 0x4969474dUL, 0x3e6e77dbUL, 0xaed16a4aUL, 0xd9d65adcUL, 0x40df0b66UL, 198 0x37d83bf0UL, 0xa9bcae53UL, 0xdebb9ec5UL, 0x47b2cf7fUL, 0x30b5ffe9UL, 199 0xbdbdf21cUL, 0xcabac28aUL, 0x53b39330UL, 0x24b4a3a6UL, 0xbad03605UL, 200 0xcdd70693UL, 0x54de5729UL, 0x23d967bfUL, 0xb3667a2eUL, 0xc4614ab8UL, 201 0x5d681b02UL, 0x2a6f2b94UL, 0xb40bbe37UL, 0xc30c8ea1UL, 0x5a05df1bUL, 202 0x2d02ef8dUL 203 }; 204 205 #ifdef _LP64 206 juint StubRoutines::x86::_crc_table_avx512[] = 207 { 208 0xe95c1271UL, 0x00000000UL, 0xce3371cbUL, 0x00000000UL, 209 0xccaa009eUL, 0x00000000UL, 0x751997d0UL, 0x00000001UL, 210 0x4a7fe880UL, 0x00000001UL, 0xe88ef372UL, 0x00000001UL, 211 0xccaa009eUL, 0x00000000UL, 0x63cd6124UL, 0x00000001UL, 212 0xf7011640UL, 0x00000001UL, 0xdb710640UL, 0x00000001UL, 213 0xd7cfc6acUL, 0x00000001UL, 0xea89367eUL, 0x00000001UL, 214 0x8cb44e58UL, 0x00000001UL, 0xdf068dc2UL, 0x00000000UL, 215 0xae0b5394UL, 0x00000000UL, 0xc7569e54UL, 0x00000001UL, 216 0xc6e41596UL, 0x00000001UL, 0x54442bd4UL, 0x00000001UL, 217 0x74359406UL, 0x00000001UL, 0x3db1ecdcUL, 0x00000000UL, 218 0x5a546366UL, 0x00000001UL, 0xf1da05aaUL, 0x00000000UL, 219 0xccaa009eUL, 0x00000000UL, 0x751997d0UL, 0x00000001UL, 220 0x00000000UL, 0x00000000UL, 0x00000000UL, 0x00000000UL 221 }; 222 223 juint StubRoutines::x86::_crc32c_table_avx512[] = 224 { 225 0xb9e02b86UL, 0x00000000UL, 0xdcb17aa4UL, 0x00000000UL, 226 0x493c7d27UL, 0x00000000UL, 0xc1068c50UL, 0x0000000eUL, 227 0x06e38d70UL, 0x00000002UL, 0x6992cea2UL, 0x00000000UL, 228 0x493c7d27UL, 0x00000000UL, 0xdd45aab8UL, 0x00000000UL, 229 0xdea713f0UL, 0x00000000UL, 0x05ec76f0UL, 0x00000001UL, 230 0x47db8317UL, 0x00000000UL, 0x2ad91c30UL, 0x00000000UL, 231 0x0715ce53UL, 0x00000000UL, 0xc49f4f67UL, 0x00000000UL, 232 0x39d3b296UL, 0x00000000UL, 0x083a6eecUL, 0x00000000UL, 233 0x9e4addf8UL, 0x00000000UL, 0x740eef02UL, 0x00000000UL, 234 0xddc0152bUL, 0x00000000UL, 0x1c291d04UL, 0x00000000UL, 235 0xba4fc28eUL, 0x00000000UL, 0x3da6d0cbUL, 0x00000000UL, 236 0x493c7d27UL, 0x00000000UL, 0xc1068c50UL, 0x0000000eUL, 237 0x00000000UL, 0x00000000UL, 0x00000000UL, 0x00000000UL 238 }; 239 240 juint StubRoutines::x86::_crc_by128_masks_avx512[] = 241 { 242 0xffffffffUL, 0xffffffffUL, 0x00000000UL, 0x00000000UL, 243 0x00000000UL, 0xffffffffUL, 0xffffffffUL, 0xffffffffUL, 244 0x80808080UL, 0x80808080UL, 0x80808080UL, 0x80808080UL 245 }; 246 247 juint StubRoutines::x86::_shuf_table_crc32_avx512[] = 248 { 249 0x83828100UL, 0x87868584UL, 0x8b8a8988UL, 0x8f8e8d8cUL, 250 0x03020100UL, 0x07060504UL, 0x0b0a0908UL, 0x000e0d0cUL 251 }; 252 253 juint StubRoutines::x86::_adler32_ascale_table[] = 254 { 255 0x00000000UL, 0x00000001UL, 0x00000002UL, 0x00000003UL, 256 0x00000004UL, 0x00000005UL, 0x00000006UL, 0x00000007UL 257 }; 258 259 juint StubRoutines::x86::_adler32_shuf0_table[] = 260 { 261 0xFFFFFF00UL, 0xFFFFFF01UL, 0xFFFFFF02UL, 0xFFFFFF03UL, 262 0xFFFFFF04UL, 0xFFFFFF05UL, 0xFFFFFF06UL, 0xFFFFFF07UL 263 }; 264 265 juint StubRoutines::x86::_adler32_shuf1_table[] = 266 { 267 0xFFFFFF08UL, 0xFFFFFF09, 0xFFFFFF0AUL, 0xFFFFFF0BUL, 268 0xFFFFFF0CUL, 0xFFFFFF0D, 0xFFFFFF0EUL, 0xFFFFFF0FUL 269 }; 270 271 #endif // _LP64 272 273 #define D 32 274 #define P 0x82F63B78 // Reflection of Castagnoli (0x11EDC6F41) 275 276 #define TILL_CYCLE 31 277 uint32_t _crc32c_pow_2k_table[TILL_CYCLE]; // because _crc32c_pow_2k_table[TILL_CYCLE == 31] == _crc32c_pow_2k_table[0] 278 279 // A. Kadatch and B. Jenkins / Everything we know about CRC but afraid to forget September 3, 2010 8 280 // Listing 1: Multiplication of normalized polynomials 281 // "a" and "b" occupy D least significant bits. 282 uint32_t crc32c_multiply(uint32_t a, uint32_t b) { 283 uint32_t product = 0; 284 uint32_t b_pow_x_table[D + 1]; // b_pow_x_table[k] = (b * x**k) mod P 285 b_pow_x_table[0] = b; 286 for (int k = 0; k < D; ++k) { 287 // If "a" has non-zero coefficient at x**k,/ add ((b * x**k) mod P) to the result. 288 if ((a & (((uint32_t)1) << (D - 1 - k))) != 0) product ^= b_pow_x_table[k]; 289 290 // Compute b_pow_x_table[k+1] = (b ** x**(k+1)) mod P. 291 if (b_pow_x_table[k] & 1) { 292 // If degree of (b_pow_x_table[k] * x) is D, then 293 // degree of (b_pow_x_table[k] * x - P) is less than D. 294 b_pow_x_table[k + 1] = (b_pow_x_table[k] >> 1) ^ P; 295 } 296 else { 297 b_pow_x_table[k + 1] = b_pow_x_table[k] >> 1; 298 } 299 } 300 return product; 301 } 302 #undef D 303 #undef P 304 305 // A. Kadatch and B. Jenkins / Everything we know about CRC but afraid to forget September 3, 2010 9 306 void crc32c_init_pow_2k(void) { 307 // _crc32c_pow_2k_table(0) = 308 // x^(2^k) mod P(x) = x mod P(x) = x 309 // Since we are operating on a reflected values 310 // x = 10b, reflect(x) = 0x40000000 311 _crc32c_pow_2k_table[0] = 0x40000000; 312 313 for (int k = 1; k < TILL_CYCLE; k++) { 314 // _crc32c_pow_2k_table(k+1) = _crc32c_pow_2k_table(k-1)^2 mod P(x) 315 uint32_t tmp = _crc32c_pow_2k_table[k - 1]; 316 _crc32c_pow_2k_table[k] = crc32c_multiply(tmp, tmp); 317 } 318 } 319 320 // x^N mod P(x) 321 uint32_t crc32c_f_pow_n(uint32_t n) { 322 // result = 1 (polynomial) 323 uint32_t one, result = 0x80000000, i = 0; 324 325 while (one = (n & 1), (n == 1 || n - one > 0)) { 326 if (one) { 327 result = crc32c_multiply(result, _crc32c_pow_2k_table[i]); 328 } 329 n >>= 1; 330 i++; 331 } 332 333 return result; 334 } 335 336 juint *StubRoutines::x86::_crc32c_table; 337 338 void StubRoutines::x86::generate_CRC32C_table(bool is_pclmulqdq_table_supported) { 339 340 static juint pow_n[CRC32C_NUM_PRECOMPUTED_CONSTANTS]; 341 342 crc32c_init_pow_2k(); 343 344 pow_n[0] = crc32c_f_pow_n(CRC32C_HIGH * 8); // 8N * 8 = 64N 345 pow_n[1] = crc32c_f_pow_n(CRC32C_HIGH * 8 * 2); // 128N 346 347 pow_n[2] = crc32c_f_pow_n(CRC32C_MIDDLE * 8); 348 pow_n[3] = crc32c_f_pow_n(CRC32C_MIDDLE * 8 * 2); 349 350 pow_n[4] = crc32c_f_pow_n(CRC32C_LOW * 8); 351 pow_n[CRC32C_NUM_PRECOMPUTED_CONSTANTS - 1] = 352 crc32c_f_pow_n(CRC32C_LOW * 8 * 2); 353 354 if (is_pclmulqdq_table_supported) { 355 _crc32c_table = pow_n; 356 } else { 357 static julong pclmulqdq_table[CRC32C_NUM_PRECOMPUTED_CONSTANTS * 256]; 358 359 for (int j = 0; j < CRC32C_NUM_PRECOMPUTED_CONSTANTS; j++) { 360 static juint X_CONST = pow_n[j]; 361 for (int64_t i = 0; i < 256; i++) { // to force 64 bit wide computations 362 // S. Gueron / Information Processing Letters 112 (2012) 184 363 // Algorithm 3: Generating a carry-less multiplication lookup table. 364 // Input: A 32-bit constant, X_CONST. 365 // Output: A table of 256 entries, each one is a 64-bit quadword, 366 // that can be used for computing "byte" * X_CONST, for a given byte. 367 pclmulqdq_table[j * 256 + i] = 368 ((i & 1) * X_CONST) ^ ((i & 2) * X_CONST) ^ ((i & 4) * X_CONST) ^ 369 ((i & 8) * X_CONST) ^ ((i & 16) * X_CONST) ^ ((i & 32) * X_CONST) ^ 370 ((i & 64) * X_CONST) ^ ((i & 128) * X_CONST); 371 } 372 } 373 _crc32c_table = (juint*)pclmulqdq_table; 374 } 375 } 376 377 ATTRIBUTE_ALIGNED(64) juint StubRoutines::x86::_k256[] = 378 { 379 0x428a2f98UL, 0x71374491UL, 0xb5c0fbcfUL, 0xe9b5dba5UL, 380 0x3956c25bUL, 0x59f111f1UL, 0x923f82a4UL, 0xab1c5ed5UL, 381 0xd807aa98UL, 0x12835b01UL, 0x243185beUL, 0x550c7dc3UL, 382 0x72be5d74UL, 0x80deb1feUL, 0x9bdc06a7UL, 0xc19bf174UL, 383 0xe49b69c1UL, 0xefbe4786UL, 0x0fc19dc6UL, 0x240ca1ccUL, 384 0x2de92c6fUL, 0x4a7484aaUL, 0x5cb0a9dcUL, 0x76f988daUL, 385 0x983e5152UL, 0xa831c66dUL, 0xb00327c8UL, 0xbf597fc7UL, 386 0xc6e00bf3UL, 0xd5a79147UL, 0x06ca6351UL, 0x14292967UL, 387 0x27b70a85UL, 0x2e1b2138UL, 0x4d2c6dfcUL, 0x53380d13UL, 388 0x650a7354UL, 0x766a0abbUL, 0x81c2c92eUL, 0x92722c85UL, 389 0xa2bfe8a1UL, 0xa81a664bUL, 0xc24b8b70UL, 0xc76c51a3UL, 390 0xd192e819UL, 0xd6990624UL, 0xf40e3585UL, 0x106aa070UL, 391 0x19a4c116UL, 0x1e376c08UL, 0x2748774cUL, 0x34b0bcb5UL, 392 0x391c0cb3UL, 0x4ed8aa4aUL, 0x5b9cca4fUL, 0x682e6ff3UL, 393 0x748f82eeUL, 0x78a5636fUL, 0x84c87814UL, 0x8cc70208UL, 394 0x90befffaUL, 0xa4506cebUL, 0xbef9a3f7UL, 0xc67178f2UL 395 }; 396 397 #ifdef _LP64 398 // used in MacroAssembler::sha256_AVX2 399 // dynamically built from _k256 400 ATTRIBUTE_ALIGNED(64) juint StubRoutines::x86::_k256_W[2*sizeof(StubRoutines::x86::_k256)]; 401 402 // used in MacroAssembler::sha512_AVX2 403 ATTRIBUTE_ALIGNED(64) julong StubRoutines::x86::_k512_W[] = 404 { 405 0x428a2f98d728ae22ULL, 0x7137449123ef65cdULL, 406 0xb5c0fbcfec4d3b2fULL, 0xe9b5dba58189dbbcULL, 407 0x3956c25bf348b538ULL, 0x59f111f1b605d019ULL, 408 0x923f82a4af194f9bULL, 0xab1c5ed5da6d8118ULL, 409 0xd807aa98a3030242ULL, 0x12835b0145706fbeULL, 410 0x243185be4ee4b28cULL, 0x550c7dc3d5ffb4e2ULL, 411 0x72be5d74f27b896fULL, 0x80deb1fe3b1696b1ULL, 412 0x9bdc06a725c71235ULL, 0xc19bf174cf692694ULL, 413 0xe49b69c19ef14ad2ULL, 0xefbe4786384f25e3ULL, 414 0x0fc19dc68b8cd5b5ULL, 0x240ca1cc77ac9c65ULL, 415 0x2de92c6f592b0275ULL, 0x4a7484aa6ea6e483ULL, 416 0x5cb0a9dcbd41fbd4ULL, 0x76f988da831153b5ULL, 417 0x983e5152ee66dfabULL, 0xa831c66d2db43210ULL, 418 0xb00327c898fb213fULL, 0xbf597fc7beef0ee4ULL, 419 0xc6e00bf33da88fc2ULL, 0xd5a79147930aa725ULL, 420 0x06ca6351e003826fULL, 0x142929670a0e6e70ULL, 421 0x27b70a8546d22ffcULL, 0x2e1b21385c26c926ULL, 422 0x4d2c6dfc5ac42aedULL, 0x53380d139d95b3dfULL, 423 0x650a73548baf63deULL, 0x766a0abb3c77b2a8ULL, 424 0x81c2c92e47edaee6ULL, 0x92722c851482353bULL, 425 0xa2bfe8a14cf10364ULL, 0xa81a664bbc423001ULL, 426 0xc24b8b70d0f89791ULL, 0xc76c51a30654be30ULL, 427 0xd192e819d6ef5218ULL, 0xd69906245565a910ULL, 428 0xf40e35855771202aULL, 0x106aa07032bbd1b8ULL, 429 0x19a4c116b8d2d0c8ULL, 0x1e376c085141ab53ULL, 430 0x2748774cdf8eeb99ULL, 0x34b0bcb5e19b48a8ULL, 431 0x391c0cb3c5c95a63ULL, 0x4ed8aa4ae3418acbULL, 432 0x5b9cca4f7763e373ULL, 0x682e6ff3d6b2b8a3ULL, 433 0x748f82ee5defb2fcULL, 0x78a5636f43172f60ULL, 434 0x84c87814a1f0ab72ULL, 0x8cc702081a6439ecULL, 435 0x90befffa23631e28ULL, 0xa4506cebde82bde9ULL, 436 0xbef9a3f7b2c67915ULL, 0xc67178f2e372532bULL, 437 0xca273eceea26619cULL, 0xd186b8c721c0c207ULL, 438 0xeada7dd6cde0eb1eULL, 0xf57d4f7fee6ed178ULL, 439 0x06f067aa72176fbaULL, 0x0a637dc5a2c898a6ULL, 440 0x113f9804bef90daeULL, 0x1b710b35131c471bULL, 441 0x28db77f523047d84ULL, 0x32caab7b40c72493ULL, 442 0x3c9ebe0a15c9bebcULL, 0x431d67c49c100d4cULL, 443 0x4cc5d4becb3e42b6ULL, 0x597f299cfc657e2aULL, 444 0x5fcb6fab3ad6faecULL, 0x6c44198c4a475817ULL, 445 }; 446 #endif