1 /*
  2  * Copyright (c) 2013, 2021, Oracle and/or its affiliates. All rights reserved.
  3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
  4  *
  5  * This code is free software; you can redistribute it and/or modify it
  6  * under the terms of the GNU General Public License version 2 only, as
  7  * published by the Free Software Foundation.
  8  *
  9  * This code is distributed in the hope that it will be useful, but WITHOUT
 10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 12  * version 2 for more details (a copy is included in the LICENSE file that
 13  * accompanied this code).
 14  *
 15  * You should have received a copy of the GNU General Public License version
 16  * 2 along with this work; if not, write to the Free Software Foundation,
 17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 18  *
 19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 20  * or visit www.oracle.com if you need additional information or have any
 21  * questions.
 22  *
 23  */
 24 
 25 #include "precompiled.hpp"
 26 #include "runtime/deoptimization.hpp"
 27 #include "runtime/frame.inline.hpp"
 28 #include "runtime/stubRoutines.hpp"
 29 #include "runtime/thread.inline.hpp"
 30 #include "utilities/globalDefinitions.hpp"
 31 #include "crc32c.h"
 32 
 33 // Implementation of the platform-specific part of StubRoutines - for
 34 // a description of how to extend it, see the stubRoutines.hpp file.
 35 
 36 address StubRoutines::x86::_verify_mxcsr_entry = NULL;
 37 address StubRoutines::x86::_key_shuffle_mask_addr = NULL;
 38 address StubRoutines::x86::_counter_shuffle_mask_addr = NULL;
 39 address StubRoutines::x86::_ghash_long_swap_mask_addr = NULL;
 40 address StubRoutines::x86::_ghash_byte_swap_mask_addr = NULL;
 41 address StubRoutines::x86::_ghash_poly_addr = NULL;
 42 address StubRoutines::x86::_ghash_shuffmask_addr = NULL;
 43 address StubRoutines::x86::_upper_word_mask_addr = NULL;
 44 address StubRoutines::x86::_shuffle_byte_flip_mask_addr = NULL;
 45 address StubRoutines::x86::_k256_adr = NULL;
 46 address StubRoutines::x86::_vector_short_to_byte_mask = NULL;
 47 address StubRoutines::x86::_vector_int_to_byte_mask = NULL;
 48 address StubRoutines::x86::_vector_int_to_short_mask = NULL;
 49 address StubRoutines::x86::_vector_all_bits_set = NULL;
 50 address StubRoutines::x86::_vector_byte_shuffle_mask = NULL;
 51 address StubRoutines::x86::_vector_short_shuffle_mask = NULL;
 52 address StubRoutines::x86::_vector_int_shuffle_mask = NULL;
 53 address StubRoutines::x86::_vector_long_shuffle_mask = NULL;
 54 address StubRoutines::x86::_vector_float_sign_mask = NULL;
 55 address StubRoutines::x86::_vector_float_sign_flip = NULL;
 56 address StubRoutines::x86::_vector_double_sign_mask = NULL;
 57 address StubRoutines::x86::_vector_double_sign_flip = NULL;
 58 address StubRoutines::x86::_vector_byte_perm_mask = NULL;
 59 address StubRoutines::x86::_vector_long_sign_mask = NULL;
 60 address StubRoutines::x86::_vector_iota_indices = NULL;
 61 address StubRoutines::x86::_vector_32_bit_mask = NULL;
 62 address StubRoutines::x86::_vector_64_bit_mask = NULL;
 63 #ifdef _LP64
 64 address StubRoutines::x86::_k256_W_adr = NULL;
 65 address StubRoutines::x86::_k512_W_addr = NULL;
 66 address StubRoutines::x86::_pshuffle_byte_flip_mask_addr_sha512 = NULL;
 67 // Base64 masks
 68 address StubRoutines::x86::_encoding_table_base64 = NULL;
 69 address StubRoutines::x86::_shuffle_base64 = NULL;
 70 address StubRoutines::x86::_avx2_shuffle_base64 = NULL;
 71 address StubRoutines::x86::_avx2_input_mask_base64 = NULL;
 72 address StubRoutines::x86::_avx2_lut_base64 = NULL;
 73 address StubRoutines::x86::_counter_mask_addr = NULL;
 74 address StubRoutines::x86::_lookup_lo_base64 = NULL;
 75 address StubRoutines::x86::_lookup_hi_base64 = NULL;
 76 address StubRoutines::x86::_lookup_lo_base64url = NULL;
 77 address StubRoutines::x86::_lookup_hi_base64url = NULL;
 78 address StubRoutines::x86::_pack_vec_base64 = NULL;
 79 address StubRoutines::x86::_join_0_1_base64 = NULL;
 80 address StubRoutines::x86::_join_1_2_base64 = NULL;
 81 address StubRoutines::x86::_join_2_3_base64 = NULL;
 82 address StubRoutines::x86::_decoding_table_base64 = NULL;
 83 #endif
 84 address StubRoutines::x86::_pshuffle_byte_flip_mask_addr = NULL;
 85 
 86 //tables common for sin and cos
 87 address StubRoutines::x86::_ONEHALF_adr = NULL;
 88 address StubRoutines::x86::_P_2_adr = NULL;
 89 address StubRoutines::x86::_SC_4_adr = NULL;
 90 address StubRoutines::x86::_Ctable_adr = NULL;
 91 address StubRoutines::x86::_SC_2_adr = NULL;
 92 address StubRoutines::x86::_SC_3_adr = NULL;
 93 address StubRoutines::x86::_SC_1_adr = NULL;
 94 address StubRoutines::x86::_PI_INV_TABLE_adr = NULL;
 95 address StubRoutines::x86::_PI_4_adr = NULL;
 96 address StubRoutines::x86::_PI32INV_adr = NULL;
 97 address StubRoutines::x86::_SIGN_MASK_adr = NULL;
 98 address StubRoutines::x86::_P_1_adr = NULL;
 99 address StubRoutines::x86::_P_3_adr = NULL;
100 address StubRoutines::x86::_NEG_ZERO_adr = NULL;
101 
102 //tables common for sincos and tancot
103 address StubRoutines::x86::_L_2il0floatpacket_0_adr = NULL;
104 address StubRoutines::x86::_Pi4Inv_adr = NULL;
105 address StubRoutines::x86::_Pi4x3_adr = NULL;
106 address StubRoutines::x86::_Pi4x4_adr = NULL;
107 address StubRoutines::x86::_ones_adr = NULL;
108 
109 uint64_t StubRoutines::x86::_crc_by128_masks[] =
110 {
111   /* The fields in this structure are arranged so that they can be
112    * picked up two at a time with 128-bit loads.
113    *
114    * Because of flipped bit order for this CRC polynomials
115    * the constant for X**N is left-shifted by 1.  This is because
116    * a 64 x 64 polynomial multiply produces a 127-bit result
117    * but the highest term is always aligned to bit 0 in the container.
118    * Pre-shifting by one fixes this, at the cost of potentially making
119    * the 32-bit constant no longer fit in a 32-bit container (thus the
120    * use of uint64_t, though this is also the size used by the carry-
121    * less multiply instruction.
122    *
123    * In addition, the flipped bit order and highest-term-at-least-bit
124    * multiply changes the constants used.  The 96-bit result will be
125    * aligned to the high-term end of the target 128-bit container,
126    * not the low-term end; that is, instead of a 512-bit or 576-bit fold,
127    * instead it is a 480 (=512-32) or 544 (=512+64-32) bit fold.
128    *
129    * This cause additional problems in the 128-to-64-bit reduction; see the
130    * code for details.  By storing a mask in the otherwise unused half of
131    * a 128-bit constant, bits can be cleared before multiplication without
132    * storing and reloading.  Note that staying on a 128-bit datapath means
133    * that some data is uselessly stored and some unused data is intersected
134    * with an irrelevant constant.
135    */
136 
137   ((uint64_t) 0xffffffffUL),     /* low  of K_M_64    */
138   ((uint64_t) 0xb1e6b092U << 1), /* high of K_M_64    */
139   ((uint64_t) 0xba8ccbe8U << 1), /* low  of K_160_96  */
140   ((uint64_t) 0x6655004fU << 1), /* high of K_160_96  */
141   ((uint64_t) 0xaa2215eaU << 1), /* low  of K_544_480 */
142   ((uint64_t) 0xe3720acbU << 1)  /* high of K_544_480 */
143 };
144 
145 /**
146  *  crc_table[] from jdk/src/share/native/java/util/zip/zlib-1.2.5/crc32.h
147  */
148 juint StubRoutines::x86::_crc_table[] =
149 {
150     0x00000000UL, 0x77073096UL, 0xee0e612cUL, 0x990951baUL, 0x076dc419UL,
151     0x706af48fUL, 0xe963a535UL, 0x9e6495a3UL, 0x0edb8832UL, 0x79dcb8a4UL,
152     0xe0d5e91eUL, 0x97d2d988UL, 0x09b64c2bUL, 0x7eb17cbdUL, 0xe7b82d07UL,
153     0x90bf1d91UL, 0x1db71064UL, 0x6ab020f2UL, 0xf3b97148UL, 0x84be41deUL,
154     0x1adad47dUL, 0x6ddde4ebUL, 0xf4d4b551UL, 0x83d385c7UL, 0x136c9856UL,
155     0x646ba8c0UL, 0xfd62f97aUL, 0x8a65c9ecUL, 0x14015c4fUL, 0x63066cd9UL,
156     0xfa0f3d63UL, 0x8d080df5UL, 0x3b6e20c8UL, 0x4c69105eUL, 0xd56041e4UL,
157     0xa2677172UL, 0x3c03e4d1UL, 0x4b04d447UL, 0xd20d85fdUL, 0xa50ab56bUL,
158     0x35b5a8faUL, 0x42b2986cUL, 0xdbbbc9d6UL, 0xacbcf940UL, 0x32d86ce3UL,
159     0x45df5c75UL, 0xdcd60dcfUL, 0xabd13d59UL, 0x26d930acUL, 0x51de003aUL,
160     0xc8d75180UL, 0xbfd06116UL, 0x21b4f4b5UL, 0x56b3c423UL, 0xcfba9599UL,
161     0xb8bda50fUL, 0x2802b89eUL, 0x5f058808UL, 0xc60cd9b2UL, 0xb10be924UL,
162     0x2f6f7c87UL, 0x58684c11UL, 0xc1611dabUL, 0xb6662d3dUL, 0x76dc4190UL,
163     0x01db7106UL, 0x98d220bcUL, 0xefd5102aUL, 0x71b18589UL, 0x06b6b51fUL,
164     0x9fbfe4a5UL, 0xe8b8d433UL, 0x7807c9a2UL, 0x0f00f934UL, 0x9609a88eUL,
165     0xe10e9818UL, 0x7f6a0dbbUL, 0x086d3d2dUL, 0x91646c97UL, 0xe6635c01UL,
166     0x6b6b51f4UL, 0x1c6c6162UL, 0x856530d8UL, 0xf262004eUL, 0x6c0695edUL,
167     0x1b01a57bUL, 0x8208f4c1UL, 0xf50fc457UL, 0x65b0d9c6UL, 0x12b7e950UL,
168     0x8bbeb8eaUL, 0xfcb9887cUL, 0x62dd1ddfUL, 0x15da2d49UL, 0x8cd37cf3UL,
169     0xfbd44c65UL, 0x4db26158UL, 0x3ab551ceUL, 0xa3bc0074UL, 0xd4bb30e2UL,
170     0x4adfa541UL, 0x3dd895d7UL, 0xa4d1c46dUL, 0xd3d6f4fbUL, 0x4369e96aUL,
171     0x346ed9fcUL, 0xad678846UL, 0xda60b8d0UL, 0x44042d73UL, 0x33031de5UL,
172     0xaa0a4c5fUL, 0xdd0d7cc9UL, 0x5005713cUL, 0x270241aaUL, 0xbe0b1010UL,
173     0xc90c2086UL, 0x5768b525UL, 0x206f85b3UL, 0xb966d409UL, 0xce61e49fUL,
174     0x5edef90eUL, 0x29d9c998UL, 0xb0d09822UL, 0xc7d7a8b4UL, 0x59b33d17UL,
175     0x2eb40d81UL, 0xb7bd5c3bUL, 0xc0ba6cadUL, 0xedb88320UL, 0x9abfb3b6UL,
176     0x03b6e20cUL, 0x74b1d29aUL, 0xead54739UL, 0x9dd277afUL, 0x04db2615UL,
177     0x73dc1683UL, 0xe3630b12UL, 0x94643b84UL, 0x0d6d6a3eUL, 0x7a6a5aa8UL,
178     0xe40ecf0bUL, 0x9309ff9dUL, 0x0a00ae27UL, 0x7d079eb1UL, 0xf00f9344UL,
179     0x8708a3d2UL, 0x1e01f268UL, 0x6906c2feUL, 0xf762575dUL, 0x806567cbUL,
180     0x196c3671UL, 0x6e6b06e7UL, 0xfed41b76UL, 0x89d32be0UL, 0x10da7a5aUL,
181     0x67dd4accUL, 0xf9b9df6fUL, 0x8ebeeff9UL, 0x17b7be43UL, 0x60b08ed5UL,
182     0xd6d6a3e8UL, 0xa1d1937eUL, 0x38d8c2c4UL, 0x4fdff252UL, 0xd1bb67f1UL,
183     0xa6bc5767UL, 0x3fb506ddUL, 0x48b2364bUL, 0xd80d2bdaUL, 0xaf0a1b4cUL,
184     0x36034af6UL, 0x41047a60UL, 0xdf60efc3UL, 0xa867df55UL, 0x316e8eefUL,
185     0x4669be79UL, 0xcb61b38cUL, 0xbc66831aUL, 0x256fd2a0UL, 0x5268e236UL,
186     0xcc0c7795UL, 0xbb0b4703UL, 0x220216b9UL, 0x5505262fUL, 0xc5ba3bbeUL,
187     0xb2bd0b28UL, 0x2bb45a92UL, 0x5cb36a04UL, 0xc2d7ffa7UL, 0xb5d0cf31UL,
188     0x2cd99e8bUL, 0x5bdeae1dUL, 0x9b64c2b0UL, 0xec63f226UL, 0x756aa39cUL,
189     0x026d930aUL, 0x9c0906a9UL, 0xeb0e363fUL, 0x72076785UL, 0x05005713UL,
190     0x95bf4a82UL, 0xe2b87a14UL, 0x7bb12baeUL, 0x0cb61b38UL, 0x92d28e9bUL,
191     0xe5d5be0dUL, 0x7cdcefb7UL, 0x0bdbdf21UL, 0x86d3d2d4UL, 0xf1d4e242UL,
192     0x68ddb3f8UL, 0x1fda836eUL, 0x81be16cdUL, 0xf6b9265bUL, 0x6fb077e1UL,
193     0x18b74777UL, 0x88085ae6UL, 0xff0f6a70UL, 0x66063bcaUL, 0x11010b5cUL,
194     0x8f659effUL, 0xf862ae69UL, 0x616bffd3UL, 0x166ccf45UL, 0xa00ae278UL,
195     0xd70dd2eeUL, 0x4e048354UL, 0x3903b3c2UL, 0xa7672661UL, 0xd06016f7UL,
196     0x4969474dUL, 0x3e6e77dbUL, 0xaed16a4aUL, 0xd9d65adcUL, 0x40df0b66UL,
197     0x37d83bf0UL, 0xa9bcae53UL, 0xdebb9ec5UL, 0x47b2cf7fUL, 0x30b5ffe9UL,
198     0xbdbdf21cUL, 0xcabac28aUL, 0x53b39330UL, 0x24b4a3a6UL, 0xbad03605UL,
199     0xcdd70693UL, 0x54de5729UL, 0x23d967bfUL, 0xb3667a2eUL, 0xc4614ab8UL,
200     0x5d681b02UL, 0x2a6f2b94UL, 0xb40bbe37UL, 0xc30c8ea1UL, 0x5a05df1bUL,
201     0x2d02ef8dUL
202 };
203 
204 #ifdef _LP64
205 juint StubRoutines::x86::_crc_table_avx512[] =
206 {
207     0xe95c1271UL, 0x00000000UL, 0xce3371cbUL, 0x00000000UL,
208     0xccaa009eUL, 0x00000000UL, 0x751997d0UL, 0x00000001UL,
209     0x4a7fe880UL, 0x00000001UL, 0xe88ef372UL, 0x00000001UL,
210     0xccaa009eUL, 0x00000000UL, 0x63cd6124UL, 0x00000001UL,
211     0xf7011640UL, 0x00000001UL, 0xdb710640UL, 0x00000001UL,
212     0xd7cfc6acUL, 0x00000001UL, 0xea89367eUL, 0x00000001UL,
213     0x8cb44e58UL, 0x00000001UL, 0xdf068dc2UL, 0x00000000UL,
214     0xae0b5394UL, 0x00000000UL, 0xc7569e54UL, 0x00000001UL,
215     0xc6e41596UL, 0x00000001UL, 0x54442bd4UL, 0x00000001UL,
216     0x74359406UL, 0x00000001UL, 0x3db1ecdcUL, 0x00000000UL,
217     0x5a546366UL, 0x00000001UL, 0xf1da05aaUL, 0x00000000UL,
218     0xccaa009eUL, 0x00000000UL, 0x751997d0UL, 0x00000001UL,
219     0x00000000UL, 0x00000000UL, 0x00000000UL, 0x00000000UL
220 };
221 
222 juint StubRoutines::x86::_crc32c_table_avx512[] =
223 {
224     0xb9e02b86UL, 0x00000000UL, 0xdcb17aa4UL, 0x00000000UL,
225     0x493c7d27UL, 0x00000000UL, 0xc1068c50UL, 0x0000000eUL,
226     0x06e38d70UL, 0x00000002UL, 0x6992cea2UL, 0x00000000UL,
227     0x493c7d27UL, 0x00000000UL, 0xdd45aab8UL, 0x00000000UL,
228     0xdea713f0UL, 0x00000000UL, 0x05ec76f0UL, 0x00000001UL,
229     0x47db8317UL, 0x00000000UL, 0x2ad91c30UL, 0x00000000UL,
230     0x0715ce53UL, 0x00000000UL, 0xc49f4f67UL, 0x00000000UL,
231     0x39d3b296UL, 0x00000000UL, 0x083a6eecUL, 0x00000000UL,
232     0x9e4addf8UL, 0x00000000UL, 0x740eef02UL, 0x00000000UL,
233     0xddc0152bUL, 0x00000000UL, 0x1c291d04UL, 0x00000000UL,
234     0xba4fc28eUL, 0x00000000UL, 0x3da6d0cbUL, 0x00000000UL,
235     0x493c7d27UL, 0x00000000UL, 0xc1068c50UL, 0x0000000eUL,
236     0x00000000UL, 0x00000000UL, 0x00000000UL, 0x00000000UL
237 };
238 
239 juint StubRoutines::x86::_crc_by128_masks_avx512[] =
240 {
241     0xffffffffUL, 0xffffffffUL, 0x00000000UL, 0x00000000UL,
242     0x00000000UL, 0xffffffffUL, 0xffffffffUL, 0xffffffffUL,
243     0x80808080UL, 0x80808080UL, 0x80808080UL, 0x80808080UL
244 };
245 
246 juint StubRoutines::x86::_shuf_table_crc32_avx512[] =
247 {
248     0x83828100UL, 0x87868584UL, 0x8b8a8988UL, 0x8f8e8d8cUL,
249     0x03020100UL, 0x07060504UL, 0x0b0a0908UL, 0x000e0d0cUL
250 };
251 
252 juint StubRoutines::x86::_adler32_ascale_table[] =
253 {
254     0x00000000UL, 0x00000001UL, 0x00000002UL, 0x00000003UL,
255     0x00000004UL, 0x00000005UL, 0x00000006UL, 0x00000007UL
256 };
257 
258 juint StubRoutines::x86::_adler32_shuf0_table[] =
259 {
260     0xFFFFFF00UL, 0xFFFFFF01UL, 0xFFFFFF02UL, 0xFFFFFF03UL,
261     0xFFFFFF04UL, 0xFFFFFF05UL, 0xFFFFFF06UL, 0xFFFFFF07UL
262 };
263 
264 juint StubRoutines::x86::_adler32_shuf1_table[] =
265 {
266     0xFFFFFF08UL, 0xFFFFFF09, 0xFFFFFF0AUL, 0xFFFFFF0BUL,
267     0xFFFFFF0CUL, 0xFFFFFF0D, 0xFFFFFF0EUL, 0xFFFFFF0FUL
268 };
269 
270 #endif // _LP64
271 
272 #define D 32
273 #define P 0x82F63B78 // Reflection of Castagnoli (0x11EDC6F41)
274 
275 #define TILL_CYCLE 31
276 uint32_t _crc32c_pow_2k_table[TILL_CYCLE]; // because _crc32c_pow_2k_table[TILL_CYCLE == 31] == _crc32c_pow_2k_table[0]
277 
278 // A. Kadatch and B. Jenkins / Everything we know about CRC but afraid to forget September 3, 2010 8
279 // Listing 1: Multiplication of normalized polynomials
280 // "a" and "b" occupy D least significant bits.
281 uint32_t crc32c_multiply(uint32_t a, uint32_t b) {
282   uint32_t product = 0;
283   uint32_t b_pow_x_table[D + 1]; // b_pow_x_table[k] = (b * x**k) mod P
284   b_pow_x_table[0] = b;
285   for (int k = 0; k < D; ++k) {
286     // If "a" has non-zero coefficient at x**k,/ add ((b * x**k) mod P) to the result.
287     if ((a & (((uint32_t)1) << (D - 1 - k))) != 0) product ^= b_pow_x_table[k];
288 
289     // Compute b_pow_x_table[k+1] = (b ** x**(k+1)) mod P.
290     if (b_pow_x_table[k] & 1) {
291       // If degree of (b_pow_x_table[k] * x) is D, then
292       // degree of (b_pow_x_table[k] * x - P) is less than D.
293       b_pow_x_table[k + 1] = (b_pow_x_table[k] >> 1) ^ P;
294     }
295     else {
296       b_pow_x_table[k + 1] = b_pow_x_table[k] >> 1;
297     }
298   }
299   return product;
300 }
301 #undef D
302 #undef P
303 
304 // A. Kadatch and B. Jenkins / Everything we know about CRC but afraid to forget September 3, 2010 9
305 void crc32c_init_pow_2k(void) {
306   // _crc32c_pow_2k_table(0) =
307   // x^(2^k) mod P(x) = x mod P(x) = x
308   // Since we are operating on a reflected values
309   // x = 10b, reflect(x) = 0x40000000
310   _crc32c_pow_2k_table[0] = 0x40000000;
311 
312   for (int k = 1; k < TILL_CYCLE; k++) {
313     // _crc32c_pow_2k_table(k+1) = _crc32c_pow_2k_table(k-1)^2 mod P(x)
314     uint32_t tmp = _crc32c_pow_2k_table[k - 1];
315     _crc32c_pow_2k_table[k] = crc32c_multiply(tmp, tmp);
316   }
317 }
318 
319 // x^N mod P(x)
320 uint32_t crc32c_f_pow_n(uint32_t n) {
321   //            result = 1 (polynomial)
322   uint32_t one, result = 0x80000000, i = 0;
323 
324   while (one = (n & 1), (n == 1 || n - one > 0)) {
325     if (one) {
326       result = crc32c_multiply(result, _crc32c_pow_2k_table[i]);
327     }
328     n >>= 1;
329     i++;
330   }
331 
332   return result;
333 }
334 
335 juint *StubRoutines::x86::_crc32c_table;
336 
337 void StubRoutines::x86::generate_CRC32C_table(bool is_pclmulqdq_table_supported) {
338 
339   static juint pow_n[CRC32C_NUM_PRECOMPUTED_CONSTANTS];
340 
341   crc32c_init_pow_2k();
342 
343   pow_n[0] = crc32c_f_pow_n(CRC32C_HIGH * 8);      // 8N * 8 = 64N
344   pow_n[1] = crc32c_f_pow_n(CRC32C_HIGH * 8 * 2);  // 128N
345 
346   pow_n[2] = crc32c_f_pow_n(CRC32C_MIDDLE * 8);
347   pow_n[3] = crc32c_f_pow_n(CRC32C_MIDDLE * 8 * 2);
348 
349   pow_n[4] = crc32c_f_pow_n(CRC32C_LOW * 8);
350   pow_n[CRC32C_NUM_PRECOMPUTED_CONSTANTS - 1] =
351             crc32c_f_pow_n(CRC32C_LOW * 8 * 2);
352 
353   if (is_pclmulqdq_table_supported) {
354     _crc32c_table = pow_n;
355   } else {
356     static julong pclmulqdq_table[CRC32C_NUM_PRECOMPUTED_CONSTANTS * 256];
357 
358     for (int j = 0; j < CRC32C_NUM_PRECOMPUTED_CONSTANTS; j++) {
359       static juint X_CONST = pow_n[j];
360       for (int64_t i = 0; i < 256; i++) { // to force 64 bit wide computations
361       // S. Gueron / Information Processing Letters 112 (2012) 184
362       // Algorithm 3: Generating a carry-less multiplication lookup table.
363       // Input: A 32-bit constant, X_CONST.
364       // Output: A table of 256 entries, each one is a 64-bit quadword,
365       // that can be used for computing "byte" * X_CONST, for a given byte.
366         pclmulqdq_table[j * 256 + i] =
367           ((i & 1) * X_CONST) ^ ((i & 2) * X_CONST) ^ ((i & 4) * X_CONST) ^
368           ((i & 8) * X_CONST) ^ ((i & 16) * X_CONST) ^ ((i & 32) * X_CONST) ^
369           ((i & 64) * X_CONST) ^ ((i & 128) * X_CONST);
370       }
371     }
372     _crc32c_table = (juint*)pclmulqdq_table;
373   }
374 }
375 
376 ATTRIBUTE_ALIGNED(64) juint StubRoutines::x86::_k256[] =
377 {
378     0x428a2f98UL, 0x71374491UL, 0xb5c0fbcfUL, 0xe9b5dba5UL,
379     0x3956c25bUL, 0x59f111f1UL, 0x923f82a4UL, 0xab1c5ed5UL,
380     0xd807aa98UL, 0x12835b01UL, 0x243185beUL, 0x550c7dc3UL,
381     0x72be5d74UL, 0x80deb1feUL, 0x9bdc06a7UL, 0xc19bf174UL,
382     0xe49b69c1UL, 0xefbe4786UL, 0x0fc19dc6UL, 0x240ca1ccUL,
383     0x2de92c6fUL, 0x4a7484aaUL, 0x5cb0a9dcUL, 0x76f988daUL,
384     0x983e5152UL, 0xa831c66dUL, 0xb00327c8UL, 0xbf597fc7UL,
385     0xc6e00bf3UL, 0xd5a79147UL, 0x06ca6351UL, 0x14292967UL,
386     0x27b70a85UL, 0x2e1b2138UL, 0x4d2c6dfcUL, 0x53380d13UL,
387     0x650a7354UL, 0x766a0abbUL, 0x81c2c92eUL, 0x92722c85UL,
388     0xa2bfe8a1UL, 0xa81a664bUL, 0xc24b8b70UL, 0xc76c51a3UL,
389     0xd192e819UL, 0xd6990624UL, 0xf40e3585UL, 0x106aa070UL,
390     0x19a4c116UL, 0x1e376c08UL, 0x2748774cUL, 0x34b0bcb5UL,
391     0x391c0cb3UL, 0x4ed8aa4aUL, 0x5b9cca4fUL, 0x682e6ff3UL,
392     0x748f82eeUL, 0x78a5636fUL, 0x84c87814UL, 0x8cc70208UL,
393     0x90befffaUL, 0xa4506cebUL, 0xbef9a3f7UL, 0xc67178f2UL
394 };
395 
396 #ifdef _LP64
397 // used in MacroAssembler::sha256_AVX2
398 // dynamically built from _k256
399 ATTRIBUTE_ALIGNED(64) juint StubRoutines::x86::_k256_W[2*sizeof(StubRoutines::x86::_k256)];
400 
401 // used in MacroAssembler::sha512_AVX2
402 ATTRIBUTE_ALIGNED(64) julong StubRoutines::x86::_k512_W[] =
403 {
404     0x428a2f98d728ae22ULL, 0x7137449123ef65cdULL,
405     0xb5c0fbcfec4d3b2fULL, 0xe9b5dba58189dbbcULL,
406     0x3956c25bf348b538ULL, 0x59f111f1b605d019ULL,
407     0x923f82a4af194f9bULL, 0xab1c5ed5da6d8118ULL,
408     0xd807aa98a3030242ULL, 0x12835b0145706fbeULL,
409     0x243185be4ee4b28cULL, 0x550c7dc3d5ffb4e2ULL,
410     0x72be5d74f27b896fULL, 0x80deb1fe3b1696b1ULL,
411     0x9bdc06a725c71235ULL, 0xc19bf174cf692694ULL,
412     0xe49b69c19ef14ad2ULL, 0xefbe4786384f25e3ULL,
413     0x0fc19dc68b8cd5b5ULL, 0x240ca1cc77ac9c65ULL,
414     0x2de92c6f592b0275ULL, 0x4a7484aa6ea6e483ULL,
415     0x5cb0a9dcbd41fbd4ULL, 0x76f988da831153b5ULL,
416     0x983e5152ee66dfabULL, 0xa831c66d2db43210ULL,
417     0xb00327c898fb213fULL, 0xbf597fc7beef0ee4ULL,
418     0xc6e00bf33da88fc2ULL, 0xd5a79147930aa725ULL,
419     0x06ca6351e003826fULL, 0x142929670a0e6e70ULL,
420     0x27b70a8546d22ffcULL, 0x2e1b21385c26c926ULL,
421     0x4d2c6dfc5ac42aedULL, 0x53380d139d95b3dfULL,
422     0x650a73548baf63deULL, 0x766a0abb3c77b2a8ULL,
423     0x81c2c92e47edaee6ULL, 0x92722c851482353bULL,
424     0xa2bfe8a14cf10364ULL, 0xa81a664bbc423001ULL,
425     0xc24b8b70d0f89791ULL, 0xc76c51a30654be30ULL,
426     0xd192e819d6ef5218ULL, 0xd69906245565a910ULL,
427     0xf40e35855771202aULL, 0x106aa07032bbd1b8ULL,
428     0x19a4c116b8d2d0c8ULL, 0x1e376c085141ab53ULL,
429     0x2748774cdf8eeb99ULL, 0x34b0bcb5e19b48a8ULL,
430     0x391c0cb3c5c95a63ULL, 0x4ed8aa4ae3418acbULL,
431     0x5b9cca4f7763e373ULL, 0x682e6ff3d6b2b8a3ULL,
432     0x748f82ee5defb2fcULL, 0x78a5636f43172f60ULL,
433     0x84c87814a1f0ab72ULL, 0x8cc702081a6439ecULL,
434     0x90befffa23631e28ULL, 0xa4506cebde82bde9ULL,
435     0xbef9a3f7b2c67915ULL, 0xc67178f2e372532bULL,
436     0xca273eceea26619cULL, 0xd186b8c721c0c207ULL,
437     0xeada7dd6cde0eb1eULL, 0xf57d4f7fee6ed178ULL,
438     0x06f067aa72176fbaULL, 0x0a637dc5a2c898a6ULL,
439     0x113f9804bef90daeULL, 0x1b710b35131c471bULL,
440     0x28db77f523047d84ULL, 0x32caab7b40c72493ULL,
441     0x3c9ebe0a15c9bebcULL, 0x431d67c49c100d4cULL,
442     0x4cc5d4becb3e42b6ULL, 0x597f299cfc657e2aULL,
443     0x5fcb6fab3ad6faecULL, 0x6c44198c4a475817ULL,
444 };
445 #endif