OLD | NEW |
1 // Copyright (c) 2011 The Chromium Authors. All rights reserved. | 1 // Copyright (c) 2011 The Chromium Authors. All rights reserved. |
2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
4 | 4 |
5 #include "base/i18n/string_search.h" | 5 #include "base/i18n/string_search.h" |
6 #include "base/logging.h" | 6 #include "base/logging.h" |
7 | 7 |
8 #include "third_party/icu/public/i18n/unicode/usearch.h" | 8 #include "third_party/icu/public/i18n/unicode/usearch.h" |
9 | 9 |
10 namespace { | 10 namespace base { |
| 11 namespace i18n { |
11 | 12 |
12 bool CollationSensitiveStringSearch(const string16& find_this, | 13 FixedPatternStringSearchIgnoringCaseAndAccents:: |
13 const string16& in_this, | 14 FixedPatternStringSearchIgnoringCaseAndAccents(const string16& find_this) |
14 UCollationStrength strength, | 15 : find_this_(find_this) { |
15 size_t* match_index, | 16 // usearch_open requires a valid string argument to be searched, even if we |
16 size_t* match_length) { | 17 // want to set it by usearch_setText afterwards. So, supplying a dummy text. |
| 18 const string16& dummy = find_this_; |
| 19 |
17 UErrorCode status = U_ZERO_ERROR; | 20 UErrorCode status = U_ZERO_ERROR; |
| 21 search_ = usearch_open(find_this_.data(), find_this_.size(), |
| 22 dummy.data(), dummy.size(), |
| 23 uloc_getDefault(), |
| 24 NULL, // breakiter |
| 25 &status); |
| 26 if (U_SUCCESS(status)) { |
| 27 UCollator* collator = usearch_getCollator(search_); |
| 28 ucol_setStrength(collator, UCOL_PRIMARY); |
| 29 usearch_reset(search_); |
| 30 } |
| 31 } |
18 | 32 |
19 UStringSearch* search = usearch_open(find_this.data(), -1, | 33 FixedPatternStringSearchIgnoringCaseAndAccents:: |
20 in_this.data(), -1, | 34 ~FixedPatternStringSearchIgnoringCaseAndAccents() { |
21 uloc_getDefault(), | 35 if (search_) |
22 NULL, // breakiter | 36 usearch_close(search_); |
23 &status); | 37 } |
| 38 |
| 39 bool FixedPatternStringSearchIgnoringCaseAndAccents::Search( |
| 40 const string16& in_this, size_t* match_index, size_t* match_length) { |
| 41 UErrorCode status = U_ZERO_ERROR; |
| 42 usearch_setText(search_, in_this.data(), in_this.size(), &status); |
24 | 43 |
25 // Default to basic substring search if usearch fails. According to | 44 // Default to basic substring search if usearch fails. According to |
26 // http://icu-project.org/apiref/icu4c/usearch_8h.html, usearch_open will fail | 45 // http://icu-project.org/apiref/icu4c/usearch_8h.html, usearch_open will fail |
27 // if either |find_this| or |in_this| are empty. In either case basic | 46 // if either |find_this| or |in_this| are empty. In either case basic |
28 // substring search will give the correct return value. | 47 // substring search will give the correct return value. |
29 if (!U_SUCCESS(status)) { | 48 if (!U_SUCCESS(status)) { |
30 size_t index = in_this.find(find_this); | 49 size_t index = in_this.find(find_this_); |
31 if (index == string16::npos) { | 50 if (index == string16::npos) { |
32 return false; | 51 return false; |
33 } else { | 52 } else { |
34 if (match_index) | 53 if (match_index) |
35 *match_index = index; | 54 *match_index = index; |
36 if (match_length) | 55 if (match_length) |
37 *match_length = find_this.size(); | 56 *match_length = find_this_.size(); |
38 return true; | 57 return true; |
39 } | 58 } |
40 } | 59 } |
41 | 60 |
42 UCollator* collator = usearch_getCollator(search); | 61 int32_t index = usearch_first(search_, &status); |
43 ucol_setStrength(collator, strength); | 62 if (!U_SUCCESS(status) || index == USEARCH_DONE) |
44 usearch_reset(search); | |
45 | |
46 int32_t index = usearch_first(search, &status); | |
47 if (!U_SUCCESS(status) || index == USEARCH_DONE) { | |
48 usearch_close(search); | |
49 return false; | 63 return false; |
50 } | |
51 | |
52 if (match_index) | 64 if (match_index) |
53 *match_index = static_cast<size_t>(index); | 65 *match_index = static_cast<size_t>(index); |
54 if (match_length) | 66 if (match_length) |
55 *match_length = static_cast<size_t>(usearch_getMatchedLength(search)); | 67 *match_length = static_cast<size_t>(usearch_getMatchedLength(search_)); |
56 | |
57 usearch_close(search); | |
58 return true; | 68 return true; |
59 } | 69 } |
60 | 70 |
61 } // namespace | |
62 | |
63 namespace base { | |
64 namespace i18n { | |
65 | |
66 bool StringSearchIgnoringCaseAndAccents(const string16& find_this, | 71 bool StringSearchIgnoringCaseAndAccents(const string16& find_this, |
67 const string16& in_this, | 72 const string16& in_this, |
68 size_t* match_index, | 73 size_t* match_index, |
69 size_t* match_length) { | 74 size_t* match_length) { |
70 return CollationSensitiveStringSearch(find_this, | 75 return FixedPatternStringSearchIgnoringCaseAndAccents(find_this).Search( |
71 in_this, | 76 in_this, match_index, match_length); |
72 UCOL_PRIMARY, | |
73 match_index, | |
74 match_length); | |
75 } | 77 } |
76 | 78 |
77 } // namespace i18n | 79 } // namespace i18n |
78 } // namespace base | 80 } // namespace base |
OLD | NEW |