feat: avoid String.toUpper() and implement Regular Expression based…

… `StringUtils.startsWithIgnoringCase()`
h2database · Feb 1, 2024 · 136a77c · grandinj · Feb 1, 2024 · manticore-projects
1 parent 9e88133
commit 136a77c
Show file tree

Hide file tree

Showing 2 changed files with 61 additions and 25 deletions.
diff --git a/h2/src/main/org/h2/bnf/context/DbContextRule.java b/h2/src/main/org/h2/bnf/context/DbContextRule.java
@@ -69,27 +69,27 @@ public void accept(BnfVisitor visitor) {
 
     @Override
     public boolean autoComplete(Sentence sentence) {
-        String query = sentence.getQuery(), s = query;
-        String up = sentence.getQueryUpper();
+        final String query = sentence.getQuery();
+        String s = query;
         switch (type) {
         case SCHEMA: {
             DbSchema[] schemas = contents.getSchemas();
             String best = null;
             DbSchema bestSchema = null;
             for (DbSchema schema: schemas) {
-                String name = StringUtils.toUpperEnglish(schema.name);
-                String quotedName = StringUtils.quoteIdentifier(schema.name);
-                if (up.startsWith(name)) {
+                String name = schema.name;
+                String quotedName = StringUtils.quoteIdentifier(name);
+                if (StringUtils.startsWithIgnoringCase(query, name)) {
                     if (best == null || name.length() > best.length()) {
                         best = name;
                         bestSchema = schema;
                     }
-                } else if (query.startsWith(quotedName)) {
+                } else if (StringUtils.startsWith(query, quotedName)) {
                     if (best == null || name.length() > best.length()) {
                         best = quotedName;
                         bestSchema = schema;
                     }
-                } else if (s.isEmpty() || name.startsWith(up) || quotedName.startsWith(query) ) {
+                } else if (s.isEmpty() || StringUtils.startsWithIgnoringCase(name, query) ||  StringUtils.startsWithIgnoringCase(quotedName, query)) {
                     if (s.length() < name.length()) {
                         sentence.add(name, name.substring(s.length()), type);
                         sentence.add(schema.quotedName + ".",
@@ -113,15 +113,15 @@ public boolean autoComplete(Sentence sentence) {
             String best = null;
             DbTableOrView bestTable = null;
             for (DbTableOrView table : tables) {
-                String name = StringUtils.toUpperEnglish(table.getName());
-                String quotedName = StringUtils.quoteIdentifier(StringUtils.toUpperEnglish(table.getName()));
+                String name = table.getName();
+                String quotedName = StringUtils.quoteIdentifier(name);
 
-                if (up.startsWith(name) || ("\"" + up).startsWith(quotedName)) {
+                if (StringUtils.startsWithIgnoringCase(query, name) || StringUtils.startsWithIgnoringCase("\"" + query, quotedName)) {
                     if (best == null || name.length() > best.length()) {
                         best = name;
                         bestTable = table;
                     }
-                } else if (s.isEmpty() || name.startsWith(up) || quotedName.startsWith(up)) {
+                } else if (s.isEmpty() || StringUtils.startsWithIgnoringCase(name, query) ||  StringUtils.startsWithIgnoringCase(quotedName, query)) {
                     if (s.length() < name.length()) {
                         sentence.add(table.getQuotedName(),
                                 table.getQuotedName().substring(s.length()),
@@ -147,16 +147,16 @@ public boolean autoComplete(Sentence sentence) {
             if (query.indexOf(' ') < 0) {
                 break;
             }
-            for (; i < up.length(); i++) {
-                char ch = up.charAt(i);
+            for (; i < query.length(); i++) {
+                char ch = query.charAt(i);
                 if (ch != '_' && !Character.isLetterOrDigit(ch)) {
                     break;
                 }
             }
             if (i == 0) {
                 break;
             }
-            String alias = up.substring(0, i);
+            String alias = query.substring(0, i);
             if (ParserUtil.isKeyword(alias, false)) {
                 break;
             }
@@ -169,17 +169,17 @@ public boolean autoComplete(Sentence sentence) {
             DbTableOrView last = sentence.getLastMatchedTable();
             if (last != null && last.getColumns() != null) {
                 for (DbColumn column : last.getColumns()) {
-                    String compare = up;
-                    String name = StringUtils.toUpperEnglish(column.getName());
+                    String compare = query;
+                    String name = column.getName();
                     if (column.getQuotedName().length() > name.length()) {
                         name = column.getQuotedName();
                         compare = query;
                     }
-                    if (compare.startsWith(name) && testColumnType(column)) {
+                    if (StringUtils.startsWithIgnoringCase(compare, name) && testColumnType(column)) {
                         String b = s.substring(name.length());
                         if (best == null || b.length() < best.length()) {
                             best = b;
-                        } else if (s.length() == 0 || name.startsWith(compare)) {
+                        } else if (s.isEmpty() || StringUtils.startsWithIgnoringCase(name, compare)) {
                             if (s.length() < name.length()) {
                                 sentence.add(column.getName(),
                                         column.getName().substring(s.length()),
@@ -198,15 +198,14 @@ public boolean autoComplete(Sentence sentence) {
                         continue;
                     }
                     for (DbColumn column : table.getColumns()) {
-                        String name = StringUtils.toUpperEnglish(column
-                                .getName());
+                        String name = column.getName();
                         if (testColumnType(column)) {
-                            if (up.startsWith(name)) {
+                            if (StringUtils.startsWithIgnoringCase(query, name)) {
                                 String b = s.substring(name.length());
                                 if (best == null || b.length() < best.length()) {
                                     best = b;
                                 }
-                            } else if (s.length() == 0 || name.startsWith(up)) {
+                            } else if (s.isEmpty() || StringUtils.startsWithIgnoringCase(name, query)) {
                                 if (s.length() < name.length()) {
                                     sentence.add(column.getName(),
                                             column.getName().substring(s.length()),
@@ -329,7 +328,7 @@ private static String autoCompleteTableAlias(Sentence sentence,
                 return s;
             }
             s = s.substring(alias.length());
-            if (s.length() == 0) {
+            if (s.isEmpty()) {
                 sentence.add(alias + ".", ".", Sentence.CONTEXT);
             }
             return s;
@@ -344,15 +343,15 @@ private static String autoCompleteTableAlias(Sentence sentence,
                         (best == null || tableName.length() > best.length())) {
                     sentence.setLastMatchedTable(table);
                     best = tableName;
-                } else if (s.length() == 0 || tableName.startsWith(alias)) {
+                } else if (s.isEmpty() || tableName.startsWith(alias)) {
                     sentence.add(tableName + ".",
                             tableName.substring(s.length()) + ".",
                             Sentence.CONTEXT);
                 }
             }
             if (best != null) {
                 s = s.substring(best.length());
-                if (s.length() == 0) {
+                if (s.isEmpty()) {
                     sentence.add(alias + ".", ".", Sentence.CONTEXT);
                 }
                 return s;

diff --git a/h2/src/main/org/h2/util/StringUtils.java b/h2/src/main/org/h2/util/StringUtils.java
@@ -9,12 +9,15 @@
 import java.lang.ref.SoftReference;
 import java.net.URLEncoder;
 import java.nio.charset.StandardCharsets;
+import java.text.Normalizer;
 import java.util.ArrayList;
 import java.util.Arrays;
 import java.util.HashSet;
 import java.util.Locale;
 import java.util.concurrent.TimeUnit;
 import java.util.function.IntPredicate;
+import java.util.regex.Matcher;
+import java.util.regex.Pattern;
 
 import org.h2.api.ErrorCode;
 import org.h2.engine.SysProperties;
@@ -1383,4 +1386,38 @@ public static String escapeMetaDataPattern(String pattern) {
         return replaceAll(pattern, "\\", "\\\\");
     }
 
+    /**
+     * Case-sensitive check whether {@code text} starts with {@code prefix}.
+     * It only calls {@code String.startsWith()} and is only here for API consistency.
+     *
+     * @param text the text to test, must not be {@code null}
+     * @param prefix the prefix to look for, must not be {@code null}
+     * @return {@code true} only if text starts with the prefix
+     */
+    public static boolean startsWith(String text, String prefix) {
+        return text.startsWith(prefix);
+    }
+
+    /**
+     * Checks case-insensitively whether {@code text} starts with {@code prefix}.
+     * Both arguments are NFD-normalized and stripped of combining marks first,
+     * so the comparison also ignores diacritics. The prefix is matched
+     * literally (never as a regular expression) and only at index 0.
+     *
+     * @param text the text to test, must not be {@code null}
+     * @param prefix the prefix to look for, must not be {@code null}
+     * @return {@code true} if the normalized text starts with the normalized
+     *         prefix, ignoring case; always {@code true} for an empty prefix
+     */
+    public static boolean startsWithIgnoringCase(String text, String prefix) {
+        String normalizedText = Normalizer.normalize(text, Normalizer.Form.NFD)
+                                          .replaceAll("\\p{M}", "");
+        String normalizedPrefix = Normalizer.normalize(prefix, Normalizer.Form.NFD)
+                                            .replaceAll("\\p{M}", "");
+
+        // regionMatches compares literally, so regex metacharacters, spaces and
+        // '#' in identifiers or user input cannot break or skew the match
+        return normalizedText.regionMatches(true, 0, normalizedPrefix, 0, normalizedPrefix.length());
+    }
+
 }