From 9eabd8b4ddbc8022c1ac6c50f4a68898251b28a0 Mon Sep 17 00:00:00 2001 From: dpeger Date: Fri, 23 Apr 2021 22:28:08 +0200 Subject: [PATCH] [#73] Avoid `String` creation using system default charset Used `StandardCharsets.UTF_8` to create `String` in `JSONParserByteArray` to avoid dependency on system's default charset and added additional emoji test. Fixes #73 --- .../java/net/minidev/json/parser/JSONParserByteArray.java | 7 +++++-- .../src/test/java/net/minidev/json/test/TestUtf8.java | 3 ++- 2 files changed, 7 insertions(+), 3 deletions(-) diff --git a/json-smart/src/main/java/net/minidev/json/parser/JSONParserByteArray.java b/json-smart/src/main/java/net/minidev/json/parser/JSONParserByteArray.java index 2e8efd8..348bce9 100644 --- a/json-smart/src/main/java/net/minidev/json/parser/JSONParserByteArray.java +++ b/json-smart/src/main/java/net/minidev/json/parser/JSONParserByteArray.java @@ -19,6 +19,9 @@ import net.minidev.json.JSONValue; import net.minidev.json.writer.JsonReaderI; +import java.nio.charset.Charset; +import java.nio.charset.StandardCharsets; + /** * Parser for JSON text. Please note that JSONParser is NOT thread-safe. * @@ -59,7 +62,7 @@ public T parse(byte[] in, JsonReaderI mapper) throws ParseException { } protected void extractString(int beginIndex, int endIndex) { - xs = new String(in, beginIndex, endIndex - beginIndex); + xs = new String(in, beginIndex, endIndex - beginIndex, StandardCharsets.UTF_8); } protected void extractStringTrim(int start, int stop) { @@ -71,7 +74,7 @@ protected void extractStringTrim(int start, int stop) { while ((start < stop) && (val[stop - 1] <= ' ')) { stop--; } - xs = new String(in, start, stop - start); + xs = new String(in, start, stop - start, StandardCharsets.UTF_8); } protected int indexOf(char c, int pos) { diff --git a/json-smart/src/test/java/net/minidev/json/test/TestUtf8.java b/json-smart/src/test/java/net/minidev/json/test/TestUtf8.java index 334187d..9058cbd 100644 --- a/json-smart/src/test/java/net/minidev/json/test/TestUtf8.java +++ b/json-smart/src/test/java/net/minidev/json/test/TestUtf8.java @@ -19,7 +19,8 @@ public static Stream languages() { Arguments.of("Russian", "Русский"), Arguments.of("Farsi", "فارسی"), Arguments.of("Korean", "한국어"), Arguments.of("Armenian", "Հայերեն"), Arguments.of("Hindi", "हिन्दी"), Arguments.of("Hebrew", "עברית"), Arguments.of("Chinese", "中文"), Arguments.of("Amharic", "አማርኛ"), Arguments.of("Malayalam", "മലയാളം"), - Arguments.of("Assyrian Neo-Aramaic", "ܐܬܘܪܝܐ"), Arguments.of("Georgian", "მარგალური")); + Arguments.of("Assyrian Neo-Aramaic", "ܐܬܘܪܝܐ"), Arguments.of("Georgian", "მარგალური"), + Arguments.of("Emojis", "🐶🐱🐭🐹🐰🦊🐻🐼🐻‍❄🐨🐯🦁🐮🐷🐽🐸🐵🙈🙉🙊🐒🐔🐧🐦🐤🐣🐥🦆🦅🦉🦇🐺🐗🐴🦄🐝🐛")); }; @ParameterizedTest