form_structure.cc revision ba5b9a6411cb1792fd21f0a078d7a25cd1ceec16
1// Copyright 2013 The Chromium Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
4
5#include "components/autofill/core/browser/form_structure.h"
6
7#include <utility>
8
9#include "base/basictypes.h"
10#include "base/command_line.h"
11#include "base/logging.h"
12#include "base/memory/scoped_ptr.h"
13#include "base/sha1.h"
14#include "base/strings/string_number_conversions.h"
15#include "base/strings/string_util.h"
16#include "base/strings/stringprintf.h"
17#include "base/strings/utf_string_conversions.h"
18#include "base/time/time.h"
19#include "components/autofill/content/browser/autocheckout_page_meta_data.h"
20#include "components/autofill/core/browser/autofill_metrics.h"
21#include "components/autofill/core/browser/autofill_type.h"
22#include "components/autofill/core/browser/autofill_xml_parser.h"
23#include "components/autofill/core/browser/field_types.h"
24#include "components/autofill/core/browser/form_field.h"
25#include "components/autofill/core/common/autofill_constants.h"
26#include "components/autofill/core/common/form_data.h"
27#include "components/autofill/core/common/form_data_predictions.h"
28#include "components/autofill/core/common/form_field_data.h"
29#include "components/autofill/core/common/form_field_data_predictions.h"
30#include "third_party/icu/source/i18n/unicode/regex.h"
31#include "third_party/libjingle/source/talk/xmllite/xmlelement.h"
32
33namespace autofill {
34namespace {
35
// Lower-case form method name that identifies a POST submission.  The
// FormStructure constructor lower-cases the form's method before comparing
// against this value.
const char kFormMethodPost[] = "post";

// XML elements and attributes.
// The kAttribute* values are attribute names and the kXMLElement* values are
// element names used when building the request XML in the encoders below.
const char kAttributeAcceptedFeatures[] = "accepts";
const char kAttributeAutofillUsed[] = "autofillused";
const char kAttributeAutofillType[] = "autofilltype";
const char kAttributeClientVersion[] = "clientversion";
const char kAttributeDataPresent[] = "datapresent";
const char kAttributeFieldID[] = "fieldid";
const char kAttributeFieldType[] = "fieldtype";
const char kAttributeFormSignature[] = "formsignature";
const char kAttributeName[] = "name";
const char kAttributeSignature[] = "signature";
const char kAttributeUrlprefixSignature[] = "urlprefixsignature";
// Values written to the "accepts" attribute of a query request.
const char kAcceptedFeaturesExperiment[] = "e"; // e=experiments
const char kAcceptedFeaturesAutocheckoutExperiment[] = "a,e"; // a=autocheckout
// Value written to the "clientversion" attribute of query and upload requests.
const char kClientVersion[] = "6.1.1715.1442/en (GGLL)";
// Declaration prepended to every serialized request.
const char kXMLDeclaration[] = "<?xml version=\"1.0\" encoding=\"UTF-8\"?>";
const char kXMLElementAutofillQuery[] = "autofillquery";
const char kXMLElementAutofillUpload[] = "autofillupload";
const char kXMLElementFieldAssignments[] = "fieldassignments";
const char kXMLElementField[] = "field";
const char kXMLElementFields[] = "fields";
const char kXMLElementForm[] = "form";
// NOTE(review): the two mode names below are not referenced in the part of
// the file reviewed here; presumably they are used further down -- confirm.
const char kBillingMode[] = "billing";
const char kShippingMode[] = "shipping";

// Strip away >= 5 consecutive digits.
// Regular expression applied to field names by |StripDigitsIfRequired()|;
// every match is removed from the name.
const char kIgnorePatternInFieldName[] = "\\d{5,}+";
65
66// Helper for |EncodeUploadRequest()| that creates a bit field corresponding to
67// |available_field_types| and returns the hex representation as a string.
68std::string EncodeFieldTypes(const ServerFieldTypeSet& available_field_types) {
69  // There are |MAX_VALID_FIELD_TYPE| different field types and 8 bits per byte,
70  // so we need ceil(MAX_VALID_FIELD_TYPE / 8) bytes to encode the bit field.
71  const size_t kNumBytes = (MAX_VALID_FIELD_TYPE + 0x7) / 8;
72
73  // Pack the types in |available_field_types| into |bit_field|.
74  std::vector<uint8> bit_field(kNumBytes, 0);
75  for (ServerFieldTypeSet::const_iterator field_type =
76           available_field_types.begin();
77       field_type != available_field_types.end();
78       ++field_type) {
79    // Set the appropriate bit in the field.  The bit we set is the one
80    // |field_type| % 8 from the left of the byte.
81    const size_t byte = *field_type / 8;
82    const size_t bit = 0x80 >> (*field_type % 8);
83    DCHECK(byte < bit_field.size());
84    bit_field[byte] |= bit;
85  }
86
87  // Discard any trailing zeroes.
88  // If there are no available types, we return the empty string.
89  size_t data_end = bit_field.size();
90  for (; data_end > 0 && !bit_field[data_end - 1]; --data_end) {
91  }
92
93  // Print all meaningfull bytes into a string.
94  std::string data_presence;
95  data_presence.reserve(data_end * 2 + 1);
96  for (size_t i = 0; i < data_end; ++i) {
97    base::StringAppendF(&data_presence, "%02x", bit_field[i]);
98  }
99
100  return data_presence;
101}
102
103// Helper for |EncodeFormRequest()| that creates XmlElements for the given field
104// in upload xml, and also add them to the parent XmlElement.
105void EncodeFieldForUpload(const AutofillField& field,
106                          buzz::XmlElement* parent) {
107  // Don't upload checkable fields.
108  if (field.is_checkable)
109    return;
110
111  ServerFieldTypeSet types = field.possible_types();
112  // |types| could be empty in unit-tests only.
113  for (ServerFieldTypeSet::iterator field_type = types.begin();
114       field_type != types.end(); ++field_type) {
115    buzz::XmlElement *field_element = new buzz::XmlElement(
116        buzz::QName(kXMLElementField));
117
118    field_element->SetAttr(buzz::QName(kAttributeSignature),
119                           field.FieldSignature());
120    field_element->SetAttr(buzz::QName(kAttributeAutofillType),
121                           base::IntToString(*field_type));
122    parent->AddElement(field_element);
123  }
124}
125
126// Helper for |EncodeFormRequest()| that creates XmlElement for the given field
127// in query xml, and also add it to the parent XmlElement.
128void EncodeFieldForQuery(const AutofillField& field,
129                         buzz::XmlElement* parent) {
130  buzz::XmlElement *field_element = new buzz::XmlElement(
131      buzz::QName(kXMLElementField));
132  field_element->SetAttr(buzz::QName(kAttributeSignature),
133                         field.FieldSignature());
134  parent->AddElement(field_element);
135}
136
137// Helper for |EncodeFormRequest()| that creates XmlElements for the given field
138// in field assignments xml, and also add them to the parent XmlElement.
139void EncodeFieldForFieldAssignments(const AutofillField& field,
140                                    buzz::XmlElement* parent) {
141  ServerFieldTypeSet types = field.possible_types();
142  for (ServerFieldTypeSet::iterator field_type = types.begin();
143       field_type != types.end(); ++field_type) {
144    buzz::XmlElement *field_element = new buzz::XmlElement(
145        buzz::QName(kXMLElementFields));
146
147    field_element->SetAttr(buzz::QName(kAttributeFieldID),
148                           field.FieldSignature());
149    field_element->SetAttr(buzz::QName(kAttributeFieldType),
150                           base::IntToString(*field_type));
151    field_element->SetAttr(buzz::QName(kAttributeName),
152                           UTF16ToUTF8(field.name));
153    parent->AddElement(field_element);
154  }
155}
156
// Returns |true| iff |token| is one of the contact type hints described in the
// implementation section of http://is.gd/whatwg_autocomplete that Chrome
// recognizes.  "fax" and "pager" are deliberately not recognized, because
// Chrome cannot fill either kind of information.  The comparison is exact and
// case-sensitive.
bool IsContactTypeHint(const std::string& token) {
  static const char* const kRecognizedHints[] = { "home", "work", "mobile" };
  const size_t kNumHints =
      sizeof(kRecognizedHints) / sizeof(kRecognizedHints[0]);

  for (size_t i = 0; i < kNumHints; ++i) {
    if (token == kRecognizedHints[i])
      return true;
  }
  return false;
}
164
165// Returns |true| iff the |token| is a type hint appropriate for a field of the
166// given |field_type|, as specified in the implementation section of
167// http://is.gd/whatwg_autocomplete
168bool ContactTypeHintMatchesFieldType(const std::string& token,
169                                     HtmlFieldType field_type) {
170  // The "home" and "work" type hints are only appropriate for email and phone
171  // number field types.
172  if (token == "home" || token == "work") {
173    return field_type == HTML_TYPE_EMAIL ||
174        (field_type >= HTML_TYPE_TEL &&
175         field_type <= HTML_TYPE_TEL_LOCAL_SUFFIX);
176  }
177
178  // The "mobile" type hint is only appropriate for phone number field types.
179  // Note that "fax" and "pager" are intentionally ignored, as Chrome does not
180  // support filling either type of information.
181  if (token == "mobile") {
182    return field_type >= HTML_TYPE_TEL &&
183        field_type <= HTML_TYPE_TEL_LOCAL_SUFFIX;
184  }
185
186  return false;
187}
188
189// Returns the Chrome Autofill-supported field type corresponding to the given
190// |autocomplete_attribute_value|, if there is one, in the context of the given
191// |field|.  Chrome Autofill supports a subset of the field types listed at
192// http://is.gd/whatwg_autocomplete
193HtmlFieldType FieldTypeFromAutocompleteAttributeValue(
194    const std::string& autocomplete_attribute_value,
195    const AutofillField& field) {
196  if (autocomplete_attribute_value == "name")
197    return HTML_TYPE_NAME;
198
199  if (autocomplete_attribute_value == "given-name")
200    return HTML_TYPE_GIVEN_NAME;
201
202  if (autocomplete_attribute_value == "additional-name") {
203    if (field.max_length == 1)
204      return HTML_TYPE_ADDITIONAL_NAME_INITIAL;
205    else
206      return HTML_TYPE_ADDITIONAL_NAME;
207  }
208
209  if (autocomplete_attribute_value == "family-name")
210    return HTML_TYPE_FAMILY_NAME;
211
212  if (autocomplete_attribute_value == "organization")
213    return HTML_TYPE_ORGANIZATION;
214
215  if (autocomplete_attribute_value == "street-address")
216    return HTML_TYPE_STREET_ADDRESS;
217
218  if (autocomplete_attribute_value == "address-line1")
219    return HTML_TYPE_ADDRESS_LINE1;
220
221  if (autocomplete_attribute_value == "address-line2")
222    return HTML_TYPE_ADDRESS_LINE2;
223
224  if (autocomplete_attribute_value == "locality")
225    return HTML_TYPE_LOCALITY;
226
227  if (autocomplete_attribute_value == "region")
228    return HTML_TYPE_REGION;
229
230  if (autocomplete_attribute_value == "country")
231    return HTML_TYPE_COUNTRY_CODE;
232
233  if (autocomplete_attribute_value == "country-name")
234    return HTML_TYPE_COUNTRY_NAME;
235
236  if (autocomplete_attribute_value == "postal-code")
237    return HTML_TYPE_POSTAL_CODE;
238
239  if (autocomplete_attribute_value == "cc-name")
240    return HTML_TYPE_CREDIT_CARD_NAME;
241
242  if (autocomplete_attribute_value == "cc-number")
243    return HTML_TYPE_CREDIT_CARD_NUMBER;
244
245  if (autocomplete_attribute_value == "cc-exp") {
246    if (field.max_length == 5)
247      return HTML_TYPE_CREDIT_CARD_EXP_DATE_2_DIGIT_YEAR;
248    else if (field.max_length == 7)
249      return HTML_TYPE_CREDIT_CARD_EXP_DATE_4_DIGIT_YEAR;
250    else
251      return HTML_TYPE_CREDIT_CARD_EXP;
252  }
253
254  if (autocomplete_attribute_value == "cc-exp-month")
255    return HTML_TYPE_CREDIT_CARD_EXP_MONTH;
256
257  if (autocomplete_attribute_value == "cc-exp-year") {
258    if (field.max_length == 2)
259      return HTML_TYPE_CREDIT_CARD_EXP_2_DIGIT_YEAR;
260    else if (field.max_length == 4)
261      return HTML_TYPE_CREDIT_CARD_EXP_4_DIGIT_YEAR;
262    else
263      return HTML_TYPE_CREDIT_CARD_EXP_YEAR;
264  }
265
266  if (autocomplete_attribute_value == "cc-csc")
267    return HTML_TYPE_CREDIT_CARD_VERIFICATION_CODE;
268
269  if (autocomplete_attribute_value == "cc-type")
270    return HTML_TYPE_CREDIT_CARD_TYPE;
271
272  if (autocomplete_attribute_value == "tel")
273    return HTML_TYPE_TEL;
274
275  if (autocomplete_attribute_value == "tel-country-code")
276    return HTML_TYPE_TEL_COUNTRY_CODE;
277
278  if (autocomplete_attribute_value == "tel-national")
279    return HTML_TYPE_TEL_NATIONAL;
280
281  if (autocomplete_attribute_value == "tel-area-code")
282    return HTML_TYPE_TEL_AREA_CODE;
283
284  if (autocomplete_attribute_value == "tel-local")
285    return HTML_TYPE_TEL_LOCAL;
286
287  if (autocomplete_attribute_value == "tel-local-prefix")
288    return HTML_TYPE_TEL_LOCAL_PREFIX;
289
290  if (autocomplete_attribute_value == "tel-local-suffix")
291    return HTML_TYPE_TEL_LOCAL_SUFFIX;
292
293  if (autocomplete_attribute_value == "email")
294    return HTML_TYPE_EMAIL;
295
296  return HTML_TYPE_UNKNOWN;
297}
298
299std::string StripDigitsIfRequired(const base::string16& input) {
300  UErrorCode status = U_ZERO_ERROR;
301  CR_DEFINE_STATIC_LOCAL(icu::UnicodeString, icu_pattern,
302                         (kIgnorePatternInFieldName));
303  CR_DEFINE_STATIC_LOCAL(icu::RegexMatcher, matcher,
304                         (icu_pattern, UREGEX_CASE_INSENSITIVE, status));
305  DCHECK_EQ(status, U_ZERO_ERROR);
306
307  icu::UnicodeString icu_input(input.data(), input.length());
308  matcher.reset(icu_input);
309
310  icu::UnicodeString replaced_string = matcher.replaceAll("", status);
311
312  std::string return_string;
313  status = U_ZERO_ERROR;
314  UTF16ToUTF8(replaced_string.getBuffer(),
315              static_cast<size_t>(replaced_string.length()),
316              &return_string);
317  if (status != U_ZERO_ERROR) {
318    DVLOG(1) << "Couldn't strip digits in " << UTF16ToUTF8(input);
319    return UTF16ToUTF8(input);
320  }
321
322  return return_string;
323}
324
325}  // namespace
326
327FormStructure::FormStructure(const FormData& form,
328                             const std::string& autocheckout_url_prefix)
329    : form_name_(form.name),
330      source_url_(form.origin),
331      target_url_(form.action),
332      autofill_count_(0),
333      active_field_count_(0),
334      upload_required_(USE_UPLOAD_RATES),
335      server_experiment_id_("no server response"),
336      has_author_specified_types_(false),
337      autocheckout_url_prefix_(autocheckout_url_prefix),
338      filled_by_autocheckout_(false) {
339  // Copy the form fields.
340  std::map<base::string16, size_t> unique_names;
341  for (std::vector<FormFieldData>::const_iterator field =
342           form.fields.begin();
343       field != form.fields.end(); field++) {
344
345    if (!ShouldSkipField(*field)) {
346      // Add all supported form fields (including with empty names) to the
347      // signature.  This is a requirement for Autofill servers.
348      form_signature_field_names_.append("&");
349      form_signature_field_names_.append(StripDigitsIfRequired(field->name));
350
351      ++active_field_count_;
352    }
353
354    // Generate a unique name for this field by appending a counter to the name.
355    // Make sure to prepend the counter with a non-numeric digit so that we are
356    // guaranteed to avoid collisions.
357    if (!unique_names.count(field->name))
358      unique_names[field->name] = 1;
359    else
360      ++unique_names[field->name];
361    base::string16 unique_name = field->name + ASCIIToUTF16("_") +
362        base::IntToString16(unique_names[field->name]);
363    fields_.push_back(new AutofillField(*field, unique_name));
364  }
365
366  std::string method = UTF16ToUTF8(form.method);
367  if (StringToLowerASCII(method) == kFormMethodPost) {
368    method_ = POST;
369  } else {
370    // Either the method is 'get', or we don't know.  In this case we default
371    // to GET.
372    method_ = GET;
373  }
374}
375
// The destructor body is intentionally empty: no explicit cleanup is performed
// here beyond what the members' own destructors do.
FormStructure::~FormStructure() {}
377
378void FormStructure::DetermineHeuristicTypes(
379    const AutofillMetrics& metric_logger) {
380  // First, try to detect field types based on each field's |autocomplete|
381  // attribute value.  If there is at least one form field that specifies an
382  // autocomplete type hint, don't try to apply other heuristics to match fields
383  // in this form.
384  bool has_author_specified_sections;
385  ParseFieldTypesFromAutocompleteAttributes(&has_author_specified_types_,
386                                            &has_author_specified_sections);
387
388  if (!has_author_specified_types_) {
389    ServerFieldTypeMap field_type_map;
390    FormField::ParseFormFields(fields_.get(), &field_type_map);
391    for (size_t i = 0; i < field_count(); ++i) {
392      AutofillField* field = fields_[i];
393      ServerFieldTypeMap::iterator iter =
394          field_type_map.find(field->unique_name());
395      if (iter != field_type_map.end())
396        field->set_heuristic_type(iter->second);
397    }
398  }
399
400  UpdateAutofillCount();
401  IdentifySections(has_author_specified_sections);
402
403  if (IsAutofillable(true)) {
404    metric_logger.LogDeveloperEngagementMetric(
405        AutofillMetrics::FILLABLE_FORM_PARSED);
406    if (has_author_specified_types_) {
407      metric_logger.LogDeveloperEngagementMetric(
408          AutofillMetrics::FILLABLE_FORM_CONTAINS_TYPE_HINTS);
409    }
410  }
411}
412
413bool FormStructure::EncodeUploadRequest(
414    const ServerFieldTypeSet& available_field_types,
415    bool form_was_autofilled,
416    std::string* encoded_xml) const {
417  DCHECK(ShouldBeCrowdsourced());
418
419  // Verify that |available_field_types| agrees with the possible field types we
420  // are uploading.
421  for (std::vector<AutofillField*>::const_iterator field = begin();
422       field != end();
423       ++field) {
424    for (ServerFieldTypeSet::const_iterator type =
425             (*field)->possible_types().begin();
426         type != (*field)->possible_types().end();
427         ++type) {
428      DCHECK(*type == UNKNOWN_TYPE ||
429             *type == EMPTY_TYPE ||
430             available_field_types.count(*type));
431    }
432  }
433
434  // Set up the <autofillupload> element and its attributes.
435  buzz::XmlElement autofill_request_xml(
436      (buzz::QName(kXMLElementAutofillUpload)));
437  autofill_request_xml.SetAttr(buzz::QName(kAttributeClientVersion),
438                               kClientVersion);
439  autofill_request_xml.SetAttr(buzz::QName(kAttributeFormSignature),
440                               FormSignature());
441  autofill_request_xml.SetAttr(buzz::QName(kAttributeAutofillUsed),
442                               form_was_autofilled ? "true" : "false");
443  autofill_request_xml.SetAttr(buzz::QName(kAttributeDataPresent),
444                               EncodeFieldTypes(available_field_types).c_str());
445
446  if (!EncodeFormRequest(FormStructure::UPLOAD, &autofill_request_xml))
447    return false;  // Malformed form, skip it.
448
449  // Obtain the XML structure as a string.
450  *encoded_xml = kXMLDeclaration;
451  *encoded_xml += autofill_request_xml.Str().c_str();
452
453  // To enable this logging, run with the flag --vmodule="form_structure=2".
454  VLOG(2) << "\n" << *encoded_xml;
455
456  return true;
457}
458
459bool FormStructure::EncodeFieldAssignments(
460    const ServerFieldTypeSet& available_field_types,
461    std::string* encoded_xml) const {
462  DCHECK(ShouldBeCrowdsourced());
463
464  // Set up the <fieldassignments> element and its attributes.
465  buzz::XmlElement autofill_request_xml(
466      (buzz::QName(kXMLElementFieldAssignments)));
467  autofill_request_xml.SetAttr(buzz::QName(kAttributeFormSignature),
468                               FormSignature());
469
470  if (!EncodeFormRequest(FormStructure::FIELD_ASSIGNMENTS,
471                         &autofill_request_xml))
472    return false;  // Malformed form, skip it.
473
474  // Obtain the XML structure as a string.
475  *encoded_xml = kXMLDeclaration;
476  *encoded_xml += autofill_request_xml.Str().c_str();
477
478  return true;
479}
480
481// static
482bool FormStructure::EncodeQueryRequest(
483    const std::vector<FormStructure*>& forms,
484    std::vector<std::string>* encoded_signatures,
485    std::string* encoded_xml) {
486  DCHECK(encoded_signatures);
487  DCHECK(encoded_xml);
488  encoded_xml->clear();
489  encoded_signatures->clear();
490  encoded_signatures->reserve(forms.size());
491
492  // Set up the <autofillquery> element and attributes.
493  buzz::XmlElement autofill_request_xml(
494      (buzz::QName(kXMLElementAutofillQuery)));
495  autofill_request_xml.SetAttr(buzz::QName(kAttributeClientVersion),
496                               kClientVersion);
497
498  // autocheckout_url_prefix tells the Autofill server where the forms in the
499  // request came from, and the the Autofill server checks internal status and
500  // decide to enable Autocheckout or not and may return Autocheckout related
501  // data in the response accordingly.
502  // There is no page/frame level object associated with FormStructure that
503  // we could extract URL prefix from. But, all the forms should come from the
504  // same frame, so they should have the same Autocheckout URL prefix. Thus we
505  // use URL prefix from the first form with Autocheckout enabled.
506  std::string autocheckout_url_prefix;
507
508  // Some badly formatted web sites repeat forms - detect that and encode only
509  // one form as returned data would be the same for all the repeated forms.
510  std::set<std::string> processed_forms;
511  for (ScopedVector<FormStructure>::const_iterator it = forms.begin();
512       it != forms.end();
513       ++it) {
514    std::string signature((*it)->FormSignature());
515    if (processed_forms.find(signature) != processed_forms.end())
516      continue;
517    processed_forms.insert(signature);
518    scoped_ptr<buzz::XmlElement> encompassing_xml_element(
519        new buzz::XmlElement(buzz::QName(kXMLElementForm)));
520    encompassing_xml_element->SetAttr(buzz::QName(kAttributeSignature),
521                                      signature);
522
523    if (!(*it)->EncodeFormRequest(FormStructure::QUERY,
524                                  encompassing_xml_element.get()))
525      continue;  // Malformed form, skip it.
526
527    if ((*it)->IsAutocheckoutEnabled()) {
528      if (autocheckout_url_prefix.empty()) {
529        autocheckout_url_prefix = (*it)->autocheckout_url_prefix_;
530      } else {
531        // Making sure all the forms in the request has the same url_prefix.
532        DCHECK_EQ(autocheckout_url_prefix, (*it)->autocheckout_url_prefix_);
533      }
534    }
535
536    autofill_request_xml.AddElement(encompassing_xml_element.release());
537    encoded_signatures->push_back(signature);
538  }
539
540  if (!encoded_signatures->size())
541    return false;
542
543  if (autocheckout_url_prefix.empty()) {
544    autofill_request_xml.SetAttr(buzz::QName(kAttributeAcceptedFeatures),
545                                 kAcceptedFeaturesExperiment);
546  } else {
547    autofill_request_xml.SetAttr(buzz::QName(kAttributeAcceptedFeatures),
548                                 kAcceptedFeaturesAutocheckoutExperiment);
549    autofill_request_xml.SetAttr(buzz::QName(kAttributeUrlprefixSignature),
550                                 Hash64Bit(autocheckout_url_prefix));
551  }
552
553  // Obtain the XML structure as a string.
554  *encoded_xml = kXMLDeclaration;
555  *encoded_xml += autofill_request_xml.Str().c_str();
556
557  return true;
558}
559
560// static
561void FormStructure::ParseQueryResponse(
562    const std::string& response_xml,
563    const std::vector<FormStructure*>& forms,
564    autofill::AutocheckoutPageMetaData* page_meta_data,
565    const AutofillMetrics& metric_logger) {
566  metric_logger.LogServerQueryMetric(AutofillMetrics::QUERY_RESPONSE_RECEIVED);
567
568  // Parse the field types from the server response to the query.
569  std::vector<AutofillServerFieldInfo> field_infos;
570  UploadRequired upload_required;
571  std::string experiment_id;
572  AutofillQueryXmlParser parse_handler(&field_infos,
573                                       &upload_required,
574                                       &experiment_id,
575                                       page_meta_data);
576  buzz::XmlParser parser(&parse_handler);
577  parser.Parse(response_xml.c_str(), response_xml.length(), true);
578  if (!parse_handler.succeeded())
579    return;
580
581  metric_logger.LogServerQueryMetric(AutofillMetrics::QUERY_RESPONSE_PARSED);
582  metric_logger.LogServerExperimentIdForQuery(experiment_id);
583
584  bool heuristics_detected_fillable_field = false;
585  bool query_response_overrode_heuristics = false;
586
587  // Copy the field types into the actual form.
588  std::vector<AutofillServerFieldInfo>::iterator current_info =
589      field_infos.begin();
590  for (std::vector<FormStructure*>::const_iterator iter = forms.begin();
591       iter != forms.end(); ++iter) {
592    FormStructure* form = *iter;
593    form->upload_required_ = upload_required;
594    form->server_experiment_id_ = experiment_id;
595
596    for (std::vector<AutofillField*>::iterator field = form->fields_.begin();
597         field != form->fields_.end(); ++field) {
598      if (form->ShouldSkipField(**field))
599        continue;
600
601      // In some cases *successful* response does not return all the fields.
602      // Quit the update of the types then.
603      if (current_info == field_infos.end())
604        break;
605
606      // UNKNOWN_TYPE is reserved for use by the client.
607      DCHECK_NE(current_info->field_type, UNKNOWN_TYPE);
608
609      ServerFieldType heuristic_type = (*field)->heuristic_type();
610      if (heuristic_type != UNKNOWN_TYPE)
611        heuristics_detected_fillable_field = true;
612
613      (*field)->set_server_type(current_info->field_type);
614      if (heuristic_type != (*field)->Type().GetStorableType())
615        query_response_overrode_heuristics = true;
616
617      // Copy default value into the field if available.
618      if (!current_info->default_value.empty())
619        (*field)->set_default_value(current_info->default_value);
620
621      ++current_info;
622    }
623
624    form->UpdateAutofillCount();
625    form->IdentifySections(false);
626  }
627
628  AutofillMetrics::ServerQueryMetric metric;
629  if (query_response_overrode_heuristics) {
630    if (heuristics_detected_fillable_field) {
631      metric = AutofillMetrics::QUERY_RESPONSE_OVERRODE_LOCAL_HEURISTICS;
632    } else {
633      metric = AutofillMetrics::QUERY_RESPONSE_WITH_NO_LOCAL_HEURISTICS;
634    }
635  } else {
636    metric = AutofillMetrics::QUERY_RESPONSE_MATCHED_LOCAL_HEURISTICS;
637  }
638  metric_logger.LogServerQueryMetric(metric);
639}
640
641// static
642void FormStructure::GetFieldTypePredictions(
643    const std::vector<FormStructure*>& form_structures,
644    std::vector<FormDataPredictions>* forms) {
645  forms->clear();
646  forms->reserve(form_structures.size());
647  for (size_t i = 0; i < form_structures.size(); ++i) {
648    FormStructure* form_structure = form_structures[i];
649    FormDataPredictions form;
650    form.data.name = form_structure->form_name_;
651    form.data.method =
652        ASCIIToUTF16((form_structure->method_ == POST) ? "POST" : "GET");
653    form.data.origin = form_structure->source_url_;
654    form.data.action = form_structure->target_url_;
655    form.signature = form_structure->FormSignature();
656    form.experiment_id = form_structure->server_experiment_id_;
657
658    for (std::vector<AutofillField*>::const_iterator field =
659             form_structure->fields_.begin();
660         field != form_structure->fields_.end(); ++field) {
661      form.data.fields.push_back(FormFieldData(**field));
662
663      FormFieldDataPredictions annotated_field;
664      annotated_field.signature = (*field)->FieldSignature();
665      annotated_field.heuristic_type =
666          AutofillType((*field)->heuristic_type()).ToString();
667      annotated_field.server_type =
668          AutofillType((*field)->server_type()).ToString();
669      annotated_field.overall_type = (*field)->Type().ToString();
670      form.fields.push_back(annotated_field);
671    }
672
673    forms->push_back(form);
674  }
675}
676
677std::string FormStructure::FormSignature() const {
678  std::string scheme(target_url_.scheme());
679  std::string host(target_url_.host());
680
681  // If target host or scheme is empty, set scheme and host of source url.
682  // This is done to match the Toolbar's behavior.
683  if (scheme.empty() || host.empty()) {
684    scheme = source_url_.scheme();
685    host = source_url_.host();
686  }
687
688  std::string form_string = scheme + "://" + host + "&" +
689                            UTF16ToUTF8(form_name_) +
690                            form_signature_field_names_;
691
692  return Hash64Bit(form_string);
693}
694
695bool FormStructure::IsAutocheckoutEnabled() const {
696  return !autocheckout_url_prefix_.empty();
697}
698
699bool FormStructure::ShouldSkipField(const FormFieldData& field) const {
700  return (field.is_checkable || field.form_control_type == "password") &&
701      !IsAutocheckoutEnabled();
702}
703
704size_t FormStructure::RequiredFillableFields() const {
705  return IsAutocheckoutEnabled() ? 0 : kRequiredAutofillFields;
706}
707
708bool FormStructure::IsAutofillable(bool require_method_post) const {
709  if (autofill_count() < RequiredFillableFields())
710    return false;
711
712  return ShouldBeParsed(require_method_post);
713}
714
715void FormStructure::UpdateAutofillCount() {
716  autofill_count_ = 0;
717  for (std::vector<AutofillField*>::const_iterator iter = begin();
718       iter != end(); ++iter) {
719    AutofillField* field = *iter;
720    if (field && field->IsFieldFillable())
721      ++autofill_count_;
722  }
723}
724
725bool FormStructure::ShouldBeParsed(bool require_method_post) const {
726  if (active_field_count() < RequiredFillableFields())
727    return false;
728
729  // Rule out http(s)://*/search?...
730  //  e.g. http://www.google.com/search?q=...
731  //       http://search.yahoo.com/search?p=...
732  if (target_url_.path() == "/search")
733    return false;
734
735  if (!IsAutocheckoutEnabled()) {
736    // Make sure there is at least one text field when Autocheckout is
737    // not enabled.
738    bool has_text_field = false;
739    for (std::vector<AutofillField*>::const_iterator it = begin();
740         it != end() && !has_text_field; ++it) {
741      has_text_field |= (*it)->form_control_type != "select-one";
742    }
743    if (!has_text_field)
744      return false;
745  }
746
747  return !require_method_post || (method_ == POST);
748}
749
750bool FormStructure::ShouldBeCrowdsourced() const {
751  // Allow all forms in Autocheckout flow to be crowdsourced.
752  return (!has_author_specified_types_ && ShouldBeParsed(true)) ||
753      IsAutocheckoutEnabled();
754}
755
756void FormStructure::UpdateFromCache(const FormStructure& cached_form) {
757  // Map from field signatures to cached fields.
758  std::map<std::string, const AutofillField*> cached_fields;
759  for (size_t i = 0; i < cached_form.field_count(); ++i) {
760    const AutofillField* field = cached_form.field(i);
761    cached_fields[field->FieldSignature()] = field;
762  }
763
764  for (std::vector<AutofillField*>::const_iterator iter = begin();
765       iter != end(); ++iter) {
766    AutofillField* field = *iter;
767
768    std::map<std::string, const AutofillField*>::const_iterator
769        cached_field = cached_fields.find(field->FieldSignature());
770    if (cached_field != cached_fields.end()) {
771      if (field->form_control_type != "select-one" &&
772          field->value == cached_field->second->value) {
773        // From the perspective of learning user data, text fields containing
774        // default values are equivalent to empty fields.
775        field->value = base::string16();
776      }
777
778      field->set_heuristic_type(cached_field->second->heuristic_type());
779      field->set_server_type(cached_field->second->server_type());
780    }
781  }
782
783  UpdateAutofillCount();
784
785  filled_by_autocheckout_ = cached_form.filled_by_autocheckout();
786  server_experiment_id_ = cached_form.server_experiment_id();
787
788  // The form signature should match between query and upload requests to the
789  // server. On many websites, form elements are dynamically added, removed, or
790  // rearranged via JavaScript between page load and form submission, so we
791  // copy over the |form_signature_field_names_| corresponding to the query
792  // request.
793  DCHECK_EQ(cached_form.form_name_, form_name_);
794  DCHECK_EQ(cached_form.source_url_, source_url_);
795  DCHECK_EQ(cached_form.target_url_, target_url_);
796  form_signature_field_names_ = cached_form.form_signature_field_names_;
797}
798
799void FormStructure::LogQualityMetrics(
800    const AutofillMetrics& metric_logger,
801    const base::TimeTicks& load_time,
802    const base::TimeTicks& interaction_time,
803    const base::TimeTicks& submission_time) const {
804  std::string experiment_id = server_experiment_id();
805  metric_logger.LogServerExperimentIdForUpload(experiment_id);
806
807  size_t num_detected_field_types = 0;
808  bool did_autofill_all_possible_fields = true;
809  bool did_autofill_some_possible_fields = false;
810  for (size_t i = 0; i < field_count(); ++i) {
811    const AutofillField* field = this->field(i);
812    metric_logger.LogQualityMetric(AutofillMetrics::FIELD_SUBMITTED,
813                                   experiment_id);
814
815    // No further logging for empty fields nor for fields where the entered data
816    // does not appear to already exist in the user's stored Autofill data.
817    const ServerFieldTypeSet& field_types = field->possible_types();
818    DCHECK(!field_types.empty());
819    if (field_types.count(EMPTY_TYPE) || field_types.count(UNKNOWN_TYPE))
820      continue;
821
822    ++num_detected_field_types;
823    if (field->is_autofilled)
824      did_autofill_some_possible_fields = true;
825    else
826      did_autofill_all_possible_fields = false;
827
828    // Collapse field types that Chrome treats as identical, e.g. home and
829    // billing address fields.
830    ServerFieldTypeSet collapsed_field_types;
831    for (ServerFieldTypeSet::const_iterator it = field_types.begin();
832         it != field_types.end();
833         ++it) {
834      // Since we currently only support US phone numbers, the (city code + main
835      // digits) number is almost always identical to the whole phone number.
836      // TODO(isherman): Improve this logic once we add support for
837      // international numbers.
838      if (*it == PHONE_HOME_CITY_AND_NUMBER)
839        collapsed_field_types.insert(PHONE_HOME_WHOLE_NUMBER);
840      else
841        collapsed_field_types.insert(AutofillType(*it).GetStorableType());
842    }
843
844    // Capture the field's type, if it is unambiguous.
845    ServerFieldType field_type = UNKNOWN_TYPE;
846    if (collapsed_field_types.size() == 1)
847      field_type = *collapsed_field_types.begin();
848
849    ServerFieldType heuristic_type =
850        AutofillType(field->heuristic_type()).GetStorableType();
851    ServerFieldType server_type =
852        AutofillType(field->server_type()).GetStorableType();
853    ServerFieldType predicted_type = field->Type().GetStorableType();
854
855    // Log heuristic, server, and overall type quality metrics, independently of
856    // whether the field was autofilled.
857    if (heuristic_type == UNKNOWN_TYPE) {
858      metric_logger.LogHeuristicTypePrediction(AutofillMetrics::TYPE_UNKNOWN,
859                                               field_type, experiment_id);
860    } else if (field_types.count(heuristic_type)) {
861      metric_logger.LogHeuristicTypePrediction(AutofillMetrics::TYPE_MATCH,
862                                               field_type, experiment_id);
863    } else {
864      metric_logger.LogHeuristicTypePrediction(AutofillMetrics::TYPE_MISMATCH,
865                                               field_type, experiment_id);
866    }
867
868    if (server_type == NO_SERVER_DATA) {
869      metric_logger.LogServerTypePrediction(AutofillMetrics::TYPE_UNKNOWN,
870                                            field_type, experiment_id);
871    } else if (field_types.count(server_type)) {
872      metric_logger.LogServerTypePrediction(AutofillMetrics::TYPE_MATCH,
873                                            field_type, experiment_id);
874    } else {
875      metric_logger.LogServerTypePrediction(AutofillMetrics::TYPE_MISMATCH,
876                                            field_type, experiment_id);
877    }
878
879    if (predicted_type == UNKNOWN_TYPE) {
880      metric_logger.LogOverallTypePrediction(AutofillMetrics::TYPE_UNKNOWN,
881                                             field_type, experiment_id);
882    } else if (field_types.count(predicted_type)) {
883      metric_logger.LogOverallTypePrediction(AutofillMetrics::TYPE_MATCH,
884                                             field_type, experiment_id);
885    } else {
886      metric_logger.LogOverallTypePrediction(AutofillMetrics::TYPE_MISMATCH,
887                                             field_type, experiment_id);
888    }
889
890    // TODO(isherman): <select> fields don't support |is_autofilled()|, so we
891    // have to skip them for the remaining metrics.
892    if (field->form_control_type == "select-one")
893      continue;
894
895    if (field->is_autofilled) {
896      metric_logger.LogQualityMetric(AutofillMetrics::FIELD_AUTOFILLED,
897                                     experiment_id);
898    } else {
899      metric_logger.LogQualityMetric(AutofillMetrics::FIELD_NOT_AUTOFILLED,
900                                     experiment_id);
901
902      if (heuristic_type == UNKNOWN_TYPE) {
903        metric_logger.LogQualityMetric(
904            AutofillMetrics::NOT_AUTOFILLED_HEURISTIC_TYPE_UNKNOWN,
905            experiment_id);
906      } else if (field_types.count(heuristic_type)) {
907        metric_logger.LogQualityMetric(
908            AutofillMetrics::NOT_AUTOFILLED_HEURISTIC_TYPE_MATCH,
909            experiment_id);
910      } else {
911        metric_logger.LogQualityMetric(
912            AutofillMetrics::NOT_AUTOFILLED_HEURISTIC_TYPE_MISMATCH,
913            experiment_id);
914      }
915
916      if (server_type == NO_SERVER_DATA) {
917        metric_logger.LogQualityMetric(
918            AutofillMetrics::NOT_AUTOFILLED_SERVER_TYPE_UNKNOWN,
919            experiment_id);
920      } else if (field_types.count(server_type)) {
921        metric_logger.LogQualityMetric(
922            AutofillMetrics::NOT_AUTOFILLED_SERVER_TYPE_MATCH,
923            experiment_id);
924      } else {
925        metric_logger.LogQualityMetric(
926            AutofillMetrics::NOT_AUTOFILLED_SERVER_TYPE_MISMATCH,
927            experiment_id);
928      }
929    }
930  }
931
932  if (num_detected_field_types < RequiredFillableFields()) {
933    metric_logger.LogUserHappinessMetric(
934        AutofillMetrics::SUBMITTED_NON_FILLABLE_FORM);
935  } else {
936    if (did_autofill_all_possible_fields) {
937      metric_logger.LogUserHappinessMetric(
938          AutofillMetrics::SUBMITTED_FILLABLE_FORM_AUTOFILLED_ALL);
939    } else if (did_autofill_some_possible_fields) {
940      metric_logger.LogUserHappinessMetric(
941          AutofillMetrics::SUBMITTED_FILLABLE_FORM_AUTOFILLED_SOME);
942    } else {
943      metric_logger.LogUserHappinessMetric(
944          AutofillMetrics::SUBMITTED_FILLABLE_FORM_AUTOFILLED_NONE);
945    }
946
947    // Unlike the other times, the |submission_time| should always be available.
948    DCHECK(!submission_time.is_null());
949
950    // The |load_time| might be unset, in the case that the form was dynamically
951    // added to the DOM.
952    if (!load_time.is_null()) {
953      // Submission should always chronologically follow form load.
954      DCHECK(submission_time > load_time);
955      base::TimeDelta elapsed = submission_time - load_time;
956      if (did_autofill_some_possible_fields)
957        metric_logger.LogFormFillDurationFromLoadWithAutofill(elapsed);
958      else
959        metric_logger.LogFormFillDurationFromLoadWithoutAutofill(elapsed);
960    }
961
962    // The |interaction_time| might be unset, in the case that the user
963    // submitted a blank form.
964    if (!interaction_time.is_null()) {
965      // Submission should always chronologically follow interaction.
966      DCHECK(submission_time > interaction_time);
967      base::TimeDelta elapsed = submission_time - interaction_time;
968      if (did_autofill_some_possible_fields) {
969        metric_logger.LogFormFillDurationFromInteractionWithAutofill(elapsed);
970      } else {
971        metric_logger.LogFormFillDurationFromInteractionWithoutAutofill(
972            elapsed);
973      }
974    }
975  }
976}
977
978const AutofillField* FormStructure::field(size_t index) const {
979  if (index >= fields_.size()) {
980    NOTREACHED();
981    return NULL;
982  }
983
984  return fields_[index];
985}
986
987AutofillField* FormStructure::field(size_t index) {
988  return const_cast<AutofillField*>(
989      static_cast<const FormStructure*>(this)->field(index));
990}
991
992size_t FormStructure::field_count() const {
993  return fields_.size();
994}
995
996size_t FormStructure::active_field_count() const {
997  return active_field_count_;
998}
999
1000std::string FormStructure::server_experiment_id() const {
1001  return server_experiment_id_;
1002}
1003
1004FormData FormStructure::ToFormData() const {
1005  // |data.user_submitted| will always be false.
1006  FormData data;
1007  data.name = form_name_;
1008  data.origin = source_url_;
1009  data.action = target_url_;
1010  data.method = ASCIIToUTF16(method_ == POST ? "POST" : "GET");
1011
1012  for (size_t i = 0; i < fields_.size(); ++i) {
1013    data.fields.push_back(FormFieldData(*fields_[i]));
1014  }
1015
1016  return data;
1017}
1018
1019bool FormStructure::operator==(const FormData& form) const {
1020  // TODO(jhawkins): Is this enough to differentiate a form?
1021  if (form_name_ == form.name &&
1022      source_url_ == form.origin &&
1023      target_url_ == form.action) {
1024    return true;
1025  }
1026
1027  // TODO(jhawkins): Compare field names, IDs and labels once we have labels
1028  // set up.
1029
1030  return false;
1031}
1032
1033bool FormStructure::operator!=(const FormData& form) const {
1034  return !operator==(form);
1035}
1036
1037std::string FormStructure::Hash64Bit(const std::string& str) {
1038  std::string hash_bin = base::SHA1HashString(str);
1039  DCHECK_EQ(20U, hash_bin.length());
1040
1041  uint64 hash64 = (((static_cast<uint64>(hash_bin[0])) & 0xFF) << 56) |
1042                  (((static_cast<uint64>(hash_bin[1])) & 0xFF) << 48) |
1043                  (((static_cast<uint64>(hash_bin[2])) & 0xFF) << 40) |
1044                  (((static_cast<uint64>(hash_bin[3])) & 0xFF) << 32) |
1045                  (((static_cast<uint64>(hash_bin[4])) & 0xFF) << 24) |
1046                  (((static_cast<uint64>(hash_bin[5])) & 0xFF) << 16) |
1047                  (((static_cast<uint64>(hash_bin[6])) & 0xFF) << 8) |
1048                   ((static_cast<uint64>(hash_bin[7])) & 0xFF);
1049
1050  return base::Uint64ToString(hash64);
1051}
1052
1053bool FormStructure::EncodeFormRequest(
1054    FormStructure::EncodeRequestType request_type,
1055    buzz::XmlElement* encompassing_xml_element) const {
1056  if (!field_count())  // Nothing to add.
1057    return false;
1058
1059  // Some badly formatted web sites repeat fields - limit number of fields to
1060  // 48, which is far larger than any valid form and XML still fits into 2K.
1061  // Do not send requests for forms with more than this many fields, as they are
1062  // near certainly not valid/auto-fillable.
1063  const size_t kMaxFieldsOnTheForm = 48;
1064  if (field_count() > kMaxFieldsOnTheForm)
1065    return false;
1066
1067  // Add the child nodes for the form fields.
1068  for (size_t index = 0; index < field_count(); ++index) {
1069    const AutofillField* field = fields_[index];
1070    switch (request_type) {
1071      case FormStructure::UPLOAD:
1072        EncodeFieldForUpload(*field, encompassing_xml_element);
1073        break;
1074      case FormStructure::QUERY:
1075        if (ShouldSkipField(*field))
1076          continue;
1077        EncodeFieldForQuery(*field, encompassing_xml_element);
1078        break;
1079      case FormStructure::FIELD_ASSIGNMENTS:
1080        EncodeFieldForFieldAssignments(*field, encompassing_xml_element);
1081        break;
1082    }
1083  }
1084  return true;
1085}
1086
1087void FormStructure::ParseFieldTypesFromAutocompleteAttributes(
1088    bool* found_types,
1089    bool* found_sections) {
1090  const std::string kDefaultSection = "-default";
1091
1092  *found_types = false;
1093  *found_sections = false;
1094  for (std::vector<AutofillField*>::iterator it = fields_.begin();
1095       it != fields_.end(); ++it) {
1096    AutofillField* field = *it;
1097
1098    // To prevent potential section name collisions, add a default suffix for
1099    // other fields.  Without this, 'autocomplete' attribute values
1100    // "section--shipping street-address" and "shipping street-address" would be
1101    // parsed identically, given the section handling code below.  We do this
1102    // before any validation so that fields with invalid attributes still end up
1103    // in the default section.  These default section names will be overridden
1104    // by subsequent heuristic parsing steps if there are no author-specified
1105    // section names.
1106    field->set_section(kDefaultSection);
1107
1108    // Canonicalize the attribute value by trimming whitespace, collapsing
1109    // non-space characters (e.g. tab) to spaces, and converting to lowercase.
1110    std::string autocomplete_attribute =
1111        CollapseWhitespaceASCII(field->autocomplete_attribute, false);
1112    autocomplete_attribute = StringToLowerASCII(autocomplete_attribute);
1113
1114    // The autocomplete attribute is overloaded: it can specify either a field
1115    // type hint or whether autocomplete should be enabled at all.  Ignore the
1116    // latter type of attribute value.
1117    if (autocomplete_attribute.empty() ||
1118        autocomplete_attribute == "on" ||
1119        autocomplete_attribute == "off") {
1120      continue;
1121    }
1122
1123    // Any other value, even it is invalid, is considered to be a type hint.
1124    // This allows a website's author to specify an attribute like
1125    // autocomplete="other" on a field to disable all Autofill heuristics for
1126    // the form.
1127    *found_types = true;
1128
1129    // Tokenize the attribute value.  Per the spec, the tokens are parsed in
1130    // reverse order.
1131    std::vector<std::string> tokens;
1132    Tokenize(autocomplete_attribute, " ", &tokens);
1133
1134    // The final token must be the field type.
1135    // If it is not one of the known types, abort.
1136    DCHECK(!tokens.empty());
1137    std::string field_type_token = tokens.back();
1138    tokens.pop_back();
1139    HtmlFieldType field_type =
1140        FieldTypeFromAutocompleteAttributeValue(field_type_token, *field);
1141    if (field_type == HTML_TYPE_UNKNOWN)
1142      continue;
1143
1144    // The preceding token, if any, may be a type hint.
1145    if (!tokens.empty() && IsContactTypeHint(tokens.back())) {
1146      // If it is, it must match the field type; otherwise, abort.
1147      // Note that an invalid token invalidates the entire attribute value, even
1148      // if the other tokens are valid.
1149      if (!ContactTypeHintMatchesFieldType(tokens.back(), field_type))
1150        continue;
1151
1152      // Chrome Autofill ignores these type hints.
1153      tokens.pop_back();
1154    }
1155
1156    // The preceding token, if any, may be a fixed string that is either
1157    // "shipping" or "billing".  Chrome Autofill treats these as implicit
1158    // section name suffixes.
1159    DCHECK_EQ(kDefaultSection, field->section());
1160    std::string section = field->section();
1161    HtmlFieldMode mode = HTML_MODE_NONE;
1162    if (!tokens.empty()) {
1163      if (tokens.back() == kShippingMode)
1164        mode = HTML_MODE_SHIPPING;
1165      else if (tokens.back() == kBillingMode)
1166        mode = HTML_MODE_BILLING;
1167    }
1168
1169    if (mode != HTML_MODE_NONE) {
1170      section = "-" + tokens.back();
1171      tokens.pop_back();
1172    }
1173
1174    // The preceding token, if any, may be a named section.
1175    const std::string kSectionPrefix = "section-";
1176    if (!tokens.empty() &&
1177        StartsWithASCII(tokens.back(), kSectionPrefix, true)) {
1178      // Prepend this section name to the suffix set in the preceding block.
1179      section = tokens.back().substr(kSectionPrefix.size()) + section;
1180      tokens.pop_back();
1181    }
1182
1183    // No other tokens are allowed.  If there are any remaining, abort.
1184    if (!tokens.empty())
1185      continue;
1186
1187    if (section != kDefaultSection) {
1188      *found_sections = true;
1189      field->set_section(section);
1190    }
1191
1192    // No errors encountered while parsing!
1193    // Update the |field|'s type based on what was parsed from the attribute.
1194    field->SetHtmlType(field_type, mode);
1195  }
1196}
1197
1198void FormStructure::IdentifySections(bool has_author_specified_sections) {
1199  if (fields_.empty())
1200    return;
1201
1202  if (!has_author_specified_sections) {
1203    // Name sections after the first field in the section.
1204    base::string16 current_section = fields_.front()->unique_name();
1205
1206    // Keep track of the types we've seen in this section.
1207    std::set<ServerFieldType> seen_types;
1208    ServerFieldType previous_type = UNKNOWN_TYPE;
1209
1210    for (std::vector<AutofillField*>::iterator field = fields_.begin();
1211         field != fields_.end(); ++field) {
1212      const ServerFieldType current_type = (*field)->Type().GetStorableType();
1213
1214      bool already_saw_current_type = seen_types.count(current_type) > 0;
1215
1216      // Forms often ask for multiple phone numbers -- e.g. both a daytime and
1217      // evening phone number.  Our phone number detection is also generally a
1218      // little off.  Hence, ignore this field type as a signal here.
1219      if (AutofillType(current_type).group() == PHONE_HOME)
1220        already_saw_current_type = false;
1221
1222      // Some forms have adjacent fields of the same type.  Two common examples:
1223      //  * Forms with two email fields, where the second is meant to "confirm"
1224      //    the first.
1225      //  * Forms with a <select> menu for states in some countries, and a
1226      //    freeform <input> field for states in other countries.  (Usually,
1227      //    only one of these two will be visible for any given choice of
1228      //    country.)
1229      // Generally, adjacent fields of the same type belong in the same logical
1230      // section.
1231      if (current_type == previous_type)
1232        already_saw_current_type = false;
1233
1234      previous_type = current_type;
1235
1236      if (current_type != UNKNOWN_TYPE && already_saw_current_type) {
1237        // We reached the end of a section, so start a new section.
1238        seen_types.clear();
1239        current_section = (*field)->unique_name();
1240      }
1241
1242      seen_types.insert(current_type);
1243      (*field)->set_section(UTF16ToUTF8(current_section));
1244    }
1245  }
1246
1247  // Ensure that credit card and address fields are in separate sections.
1248  // This simplifies the section-aware logic in autofill_manager.cc.
1249  for (std::vector<AutofillField*>::iterator field = fields_.begin();
1250       field != fields_.end(); ++field) {
1251    FieldTypeGroup field_type_group = (*field)->Type().group();
1252    if (field_type_group == CREDIT_CARD)
1253      (*field)->set_section((*field)->section() + "-cc");
1254    else
1255      (*field)->set_section((*field)->section() + "-default");
1256  }
1257}
1258
1259}  // namespace autofill
1260