OLD | NEW |
| (Empty) |
1 // Copyright (c) 2011 The Chromium Authors. All rights reserved. | |
2 // Use of this source code is governed by a BSD-style license that can be | |
3 // found in the LICENSE file. | |
4 | |
5 #include "chrome/browser/autofill/credit_card_field.h" | |
6 | |
7 #include <stddef.h> | |
8 | |
9 #include "base/logging.h" | |
10 #include "base/memory/scoped_ptr.h" | |
11 #include "base/string16.h" | |
12 #include "base/string_util.h" | |
13 #include "base/utf_string_conversions.h" | |
14 #include "chrome/browser/autofill/autofill_field.h" | |
15 #include "chrome/browser/autofill/autofill_regex_constants.h" | |
16 #include "chrome/browser/autofill/autofill_scanner.h" | |
17 #include "chrome/browser/autofill/field_types.h" | |
18 #include "ui/base/l10n/l10n_util.h" | |
19 | |
20 // static | |
21 FormField* CreditCardField::Parse(AutofillScanner* scanner) { | |
22 if (scanner->IsEnd()) | |
23 return NULL; | |
24 | |
25 scoped_ptr<CreditCardField> credit_card_field(new CreditCardField); | |
26 size_t saved_cursor = scanner->SaveCursor(); | |
27 | |
28 // Credit card fields can appear in many different orders. | |
29 // We loop until no more credit card related fields are found, see |break| at | |
30 // bottom of the loop. | |
31 for (int fields = 0; !scanner->IsEnd(); ++fields) { | |
32 // Ignore gift card fields. | |
33 if (ParseField(scanner, UTF8ToUTF16(autofill::kGiftCardRe), NULL)) | |
34 break; | |
35 | |
36 // Sometimes the cardholder field is just labeled "name". Unfortunately this | |
37 // is a dangerously generic word to search for, since it will often match a | |
38 // name (not cardholder name) field before or after credit card fields. So | |
39 // we search for "name" only when we've already parsed at least one other | |
40 // credit card field and haven't yet parsed the expiration date (which | |
41 // usually appears at the end). | |
42 if (credit_card_field->cardholder_ == NULL) { | |
43 string16 name_pattern; | |
44 if (fields == 0 || credit_card_field->expiration_month_) { | |
45 // at beginning or end | |
46 name_pattern = UTF8ToUTF16(autofill::kNameOnCardRe); | |
47 } else { | |
48 name_pattern = UTF8ToUTF16(autofill::kNameOnCardContextualRe); | |
49 } | |
50 | |
51 if (ParseField(scanner, name_pattern, &credit_card_field->cardholder_)) | |
52 continue; | |
53 | |
54 // As a hard-coded hack for Expedia's billing pages (expedia_checkout.html | |
55 // and ExpediaBilling.html in our test suite), recognize separate fields | |
56 // for the cardholder's first and last name if they have the labels "cfnm" | |
57 // and "clnm". | |
58 scanner->SaveCursor(); | |
59 const AutofillField* first; | |
60 if (ParseField(scanner, ASCIIToUTF16("^cfnm"), &first) && | |
61 ParseField(scanner, ASCIIToUTF16("^clnm"), | |
62 &credit_card_field->cardholder_last_)) { | |
63 credit_card_field->cardholder_ = first; | |
64 continue; | |
65 } | |
66 scanner->Rewind(); | |
67 } | |
68 | |
69 // Check for a credit card type (Visa, MasterCard, etc.) field. | |
70 string16 type_pattern = UTF8ToUTF16(autofill::kCardTypeRe); | |
71 if (!credit_card_field->type_ && | |
72 ParseFieldSpecifics(scanner, type_pattern, | |
73 MATCH_DEFAULT | MATCH_SELECT, | |
74 &credit_card_field->type_)) { | |
75 continue; | |
76 } | |
77 | |
78 // We look for a card security code before we look for a credit | |
79 // card number and match the general term "number". The security code | |
80 // has a plethora of names; we've seen "verification #", | |
81 // "verification number", "card identification number" and others listed | |
82 // in the |pattern| below. | |
83 string16 pattern = UTF8ToUTF16(autofill::kCardCvcRe); | |
84 if (!credit_card_field->verification_ && | |
85 ParseField(scanner, pattern, &credit_card_field->verification_)) { | |
86 continue; | |
87 } | |
88 | |
89 pattern = UTF8ToUTF16(autofill::kCardNumberRe); | |
90 if (!credit_card_field->number_ && | |
91 ParseField(scanner, pattern, &credit_card_field->number_)) { | |
92 continue; | |
93 } | |
94 | |
95 if (LowerCaseEqualsASCII(scanner->Cursor()->form_control_type, "month")) { | |
96 credit_card_field->expiration_month_ = scanner->Cursor(); | |
97 scanner->Advance(); | |
98 } else { | |
99 // First try to parse split month/year expiration fields. | |
100 scanner->SaveCursor(); | |
101 pattern = UTF8ToUTF16(autofill::kExpirationMonthRe); | |
102 if (!credit_card_field->expiration_month_ && | |
103 ParseFieldSpecifics(scanner, pattern, MATCH_DEFAULT | MATCH_SELECT, | |
104 &credit_card_field->expiration_month_)) { | |
105 pattern = UTF8ToUTF16(autofill::kExpirationYearRe); | |
106 if (ParseFieldSpecifics(scanner, pattern, MATCH_DEFAULT | MATCH_SELECT, | |
107 &credit_card_field->expiration_year_)) { | |
108 continue; | |
109 } | |
110 } | |
111 | |
112 // If that fails, try to parse a combined expiration field. | |
113 if (!credit_card_field->expiration_date_) { | |
114 // Look for a 2-digit year first. | |
115 scanner->Rewind(); | |
116 pattern = UTF8ToUTF16(autofill::kExpirationDate2DigitYearRe); | |
117 // We allow <select> fields, because they're used e.g. on qvc.com. | |
118 if (ParseFieldSpecifics(scanner, pattern, | |
119 MATCH_LABEL | MATCH_VALUE | MATCH_TEXT | | |
120 MATCH_SELECT, | |
121 &credit_card_field->expiration_date_)) { | |
122 credit_card_field->is_two_digit_year_ = true; | |
123 continue; | |
124 } | |
125 | |
126 pattern = UTF8ToUTF16(autofill::kExpirationDateRe); | |
127 if (ParseFieldSpecifics(scanner, pattern, | |
128 MATCH_LABEL | MATCH_VALUE | MATCH_TEXT | | |
129 MATCH_SELECT, | |
130 &credit_card_field->expiration_date_)) { | |
131 continue; | |
132 } | |
133 } | |
134 | |
135 if (credit_card_field->expiration_month_ && | |
136 !credit_card_field->expiration_year_ && | |
137 !credit_card_field->expiration_date_) { | |
138 // Parsed a month but couldn't parse a year; give up. | |
139 scanner->RewindTo(saved_cursor); | |
140 return NULL; | |
141 } | |
142 } | |
143 | |
144 // Some pages (e.g. ExpediaBilling.html) have a "card description" | |
145 // field; we parse this field but ignore it. | |
146 // We also ignore any other fields within a credit card block that | |
147 // start with "card", under the assumption that they are related to | |
148 // the credit card section being processed but are uninteresting to us. | |
149 if (ParseField(scanner, UTF8ToUTF16(autofill::kCardIgnoredRe), NULL)) | |
150 continue; | |
151 | |
152 break; | |
153 } | |
154 | |
155 // Some pages have a billing address field after the cardholder name field. | |
156 // For that case, allow only just the cardholder name field. The remaining | |
157 // CC fields will be picked up in a following CreditCardField. | |
158 if (credit_card_field->cardholder_) | |
159 return credit_card_field.release(); | |
160 | |
161 // On some pages, the user selects a card type using radio buttons | |
162 // (e.g. test page Apple Store Billing.html). We can't handle that yet, | |
163 // so we treat the card type as optional for now. | |
164 // The existence of a number or cvc in combination with expiration date is | |
165 // a strong enough signal that this is a credit card. It is possible that | |
166 // the number and name were parsed in a separate part of the form. So if | |
167 // the cvc and date were found independently they are returned. | |
168 if ((credit_card_field->number_ || credit_card_field->verification_) && | |
169 (credit_card_field->expiration_date_ || | |
170 (credit_card_field->expiration_month_ && | |
171 (credit_card_field->expiration_year_ || | |
172 (LowerCaseEqualsASCII( | |
173 credit_card_field->expiration_month_->form_control_type, | |
174 "month")))))) { | |
175 return credit_card_field.release(); | |
176 } | |
177 | |
178 scanner->RewindTo(saved_cursor); | |
179 return NULL; | |
180 } | |
181 | |
182 CreditCardField::CreditCardField() | |
183 : cardholder_(NULL), | |
184 cardholder_last_(NULL), | |
185 type_(NULL), | |
186 number_(NULL), | |
187 verification_(NULL), | |
188 expiration_month_(NULL), | |
189 expiration_year_(NULL), | |
190 expiration_date_(NULL), | |
191 is_two_digit_year_(false) { | |
192 } | |
193 | |
194 bool CreditCardField::ClassifyField(FieldTypeMap* map) const { | |
195 bool ok = AddClassification(number_, CREDIT_CARD_NUMBER, map); | |
196 ok = ok && AddClassification(type_, CREDIT_CARD_TYPE, map); | |
197 ok = ok && AddClassification(verification_, CREDIT_CARD_VERIFICATION_CODE, | |
198 map); | |
199 | |
200 // If the heuristics detected first and last name in separate fields, | |
201 // then ignore both fields. Putting them into separate fields is probably | |
202 // wrong, because the credit card can also contain a middle name or middle | |
203 // initial. | |
204 if (cardholder_last_ == NULL) | |
205 ok = ok && AddClassification(cardholder_, CREDIT_CARD_NAME, map); | |
206 | |
207 if (expiration_date_) { | |
208 if (is_two_digit_year_) { | |
209 ok = ok && AddClassification(expiration_date_, | |
210 CREDIT_CARD_EXP_DATE_2_DIGIT_YEAR, map); | |
211 } else { | |
212 ok = ok && AddClassification(expiration_date_, | |
213 CREDIT_CARD_EXP_DATE_4_DIGIT_YEAR, map); | |
214 } | |
215 } else { | |
216 ok = ok && AddClassification(expiration_month_, CREDIT_CARD_EXP_MONTH, map); | |
217 if (is_two_digit_year_) { | |
218 ok = ok && AddClassification(expiration_year_, | |
219 CREDIT_CARD_EXP_2_DIGIT_YEAR, | |
220 map); | |
221 } else { | |
222 ok = ok && AddClassification(expiration_year_, | |
223 CREDIT_CARD_EXP_4_DIGIT_YEAR, | |
224 map); | |
225 } | |
226 } | |
227 | |
228 return ok; | |
229 } | |
OLD | NEW |