blob: acab52bbe8fcebd2b647c1e1d50d3e54ce95f177 [file] [log] [blame]
Alina Zaidid07acba2021-03-09 21:23:35 +00001/*
2 * Copyright (C) 2021 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17package com.android.launcher3.search;
18
19import java.text.Collator;
20
21/**
22 * Utilities for matching query string to target string.
23 */
24public class StringMatcherUtility {
25
26 /**
27 * Returns {@code true} is {@code query} is a prefix substring of a complete word/phrase in
28 * {@code target}.
29 */
30 public static boolean matches(String query, String target, StringMatcher matcher) {
31 int queryLength = query.length();
32
33 int targetLength = target.length();
34
35 if (targetLength < queryLength || queryLength <= 0) {
36 return false;
37 }
38
39 if (requestSimpleFuzzySearch(query)) {
40 return target.toLowerCase().contains(query);
41 }
42
43 int lastType;
44 int thisType = Character.UNASSIGNED;
45 int nextType = Character.getType(target.codePointAt(0));
46
47 int end = targetLength - queryLength;
48 for (int i = 0; i <= end; i++) {
49 lastType = thisType;
50 thisType = nextType;
51 nextType = i < (targetLength - 1)
52 ? Character.getType(target.codePointAt(i + 1)) : Character.UNASSIGNED;
53 if (isBreak(thisType, lastType, nextType)
54 && matcher.matches(query, target.substring(i, i + queryLength))) {
55 return true;
56 }
57 }
58 return false;
59 }
60
61 /**
62 * Returns true if the current point should be a break point. Following cases
63 * are considered as break points:
64 * 1) Any non space character after a space character
65 * 2) Any digit after a non-digit character
66 * 3) Any capital character after a digit or small character
67 * 4) Any capital character before a small character
68 */
69 private static boolean isBreak(int thisType, int prevType, int nextType) {
70 switch (prevType) {
71 case Character.UNASSIGNED:
72 case Character.SPACE_SEPARATOR:
73 case Character.LINE_SEPARATOR:
74 case Character.PARAGRAPH_SEPARATOR:
75 return true;
76 }
77 switch (thisType) {
78 case Character.UPPERCASE_LETTER:
79 if (nextType == Character.UPPERCASE_LETTER) {
80 return true;
81 }
82 // Follow through
83 case Character.TITLECASE_LETTER:
84 // Break point if previous was not a upper case
85 return prevType != Character.UPPERCASE_LETTER;
86 case Character.LOWERCASE_LETTER:
87 // Break point if previous was not a letter.
88 return prevType > Character.OTHER_LETTER || prevType <= Character.UNASSIGNED;
89 case Character.DECIMAL_DIGIT_NUMBER:
90 case Character.LETTER_NUMBER:
91 case Character.OTHER_NUMBER:
92 // Break point if previous was not a number
93 return !(prevType == Character.DECIMAL_DIGIT_NUMBER
94 || prevType == Character.LETTER_NUMBER
95 || prevType == Character.OTHER_NUMBER);
96 case Character.MATH_SYMBOL:
97 case Character.CURRENCY_SYMBOL:
98 case Character.OTHER_PUNCTUATION:
99 case Character.DASH_PUNCTUATION:
100 // Always a break point for a symbol
101 return true;
102 default:
103 return false;
104 }
105 }
106
107 /**
108 * Performs locale sensitive string comparison using {@link Collator}.
109 */
110 public static class StringMatcher {
111
112 private static final char MAX_UNICODE = '\uFFFF';
113
114 private final Collator mCollator;
115
116 StringMatcher() {
117 // On android N and above, Collator uses ICU implementation which has a much better
118 // support for non-latin locales.
119 mCollator = Collator.getInstance();
120 mCollator.setStrength(Collator.PRIMARY);
121 mCollator.setDecomposition(Collator.CANONICAL_DECOMPOSITION);
122 }
123
124 /**
125 * Returns true if {@param query} is a prefix of {@param target}
126 */
127 public boolean matches(String query, String target) {
128 switch (mCollator.compare(query, target)) {
129 case 0:
130 return true;
131 case -1:
132 // The target string can contain a modifier which would make it larger than
133 // the query string (even though the length is same). If the query becomes
134 // larger after appending a unicode character, it was originally a prefix of
135 // the target string and hence should match.
136 return mCollator.compare(query + MAX_UNICODE, target) > -1;
137 default:
138 return false;
139 }
140 }
141
142 public static StringMatcher getInstance() {
143 return new StringMatcher();
144 }
145 }
146
147 /**
148 * Matching optimization to search in Chinese.
149 */
150 private static boolean requestSimpleFuzzySearch(String s) {
151 for (int i = 0; i < s.length(); ) {
152 int codepoint = s.codePointAt(i);
153 i += Character.charCount(codepoint);
154 switch (Character.UnicodeScript.of(codepoint)) {
155 case HAN:
156 //Character.UnicodeScript.HAN: use String.contains to match
157 return true;
158 }
159 }
160 return false;
161 }
162}