1 /* 2 * Copyright (c) 2021, 2023, Oracle and/or its affiliates. All rights reserved. 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 4 * 5 * This code is free software; you can redistribute it and/or modify it 6 * under the terms of the GNU General Public License version 2 only, as 7 * published by the Free Software Foundation. 8 * 9 * This code is distributed in the hope that it will be useful, but WITHOUT 10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License 12 * version 2 for more details (a copy is included in the LICENSE file that 13 * accompanied this code). 14 * 15 * You should have received a copy of the GNU General Public License version 16 * 2 along with this work; if not, write to the Free Software Foundation, 17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. 18 * 19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA 20 * or visit www.oracle.com if you need additional information or have any 21 * questions. 22 * 23 */ 24 25 import java.lang.foreign.Arena; 26 import java.lang.foreign.MemorySegment; 27 28 import org.testng.annotations.*; 29 import static org.testng.Assert.*; 30 31 /* 32 * @test 33 * @enablePreview 34 * @requires jdk.foreign.linker != "UNSUPPORTED" 35 * @run testng TestStringEncoding 36 */ 37 38 public class TestStringEncoding { 39 40 @Test(dataProvider = "strings") 41 public void testStrings(String testString, int expectedByteLength) { 42 try (Arena arena = Arena.ofConfined()) { 43 MemorySegment text = arena.allocateUtf8String(testString); 44 45 assertEquals(text.byteSize(), expectedByteLength); 46 47 String roundTrip = text.getUtf8String(0); 48 assertEquals(roundTrip, testString); 49 } 50 } 51 52 @DataProvider 53 public static Object[][] strings() { 54 return new Object[][] { 55 { "testing", 8 }, 56 { "", 1 }, 57 { "X", 2 }, 58 { "12345", 6 }, 59 { "yen \u00A5", 7 }, // in UTF-8 2 bytes: 0xC2 0xA5 60 { "snowman \u26C4", 12 }, // in UTF-8 three bytes: 0xE2 0x9B 0x84 61 { "rainbow \uD83C\uDF08", 13 } // in UTF-8 four bytes: 0xF0 0x9F 0x8C 0x88 62 }; 63 } 64 }