// Copyright 2013 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
4
5#ifndef COMPONENTS_AUTOFILL_CORE_BROWSER_FORM_STRUCTURE_H_
6#define COMPONENTS_AUTOFILL_CORE_BROWSER_FORM_STRUCTURE_H_
7
8#include <string>
9#include <vector>
10
11#include "base/gtest_prod_util.h"
12#include "base/memory/scoped_ptr.h"
13#include "base/memory/scoped_vector.h"
14#include "components/autofill/core/browser/autofill_field.h"
15#include "components/autofill/core/browser/autofill_type.h"
16#include "components/autofill/core/browser/field_types.h"
17#include "components/autofill/core/common/web_element_descriptor.h"
18#include "url/gurl.h"
19
// The HTTP method used to submit a form: GET or POST.
// Kept as an unscoped enum at global scope so existing callers that refer to
// the bare enumerators (GET, POST) keep compiling.
enum RequestMethod {
  GET,
  POST
};
24
// Whether the server expects us to always upload, never upload, or default
// to the stored upload rates.
enum UploadRequired {
  UPLOAD_NOT_REQUIRED,  // Never upload.
  UPLOAD_REQUIRED,      // Always upload.
  USE_UPLOAD_RATES      // Fall back to the stored upload rates.
};
30
// Forward declarations: these types are only used by reference or pointer in
// this header, so their full definitions are not needed here.
namespace base {
class TimeTicks;
}

namespace buzz {
class XmlElement;
}
38
39namespace autofill {
40
// Forward declarations of autofill types that this header only names in
// function signatures.
class AutofillMetrics;

struct AutocheckoutPageMetaData;
struct FormData;
struct FormDataPredictions;
46
47// FormStructure stores a single HTML form together with the values entered
48// in the fields along with additional information needed by Autofill.
49class FormStructure {
50 public:
51  FormStructure(const FormData& form,
52                const std::string& autocheckout_url_prefix);
53  virtual ~FormStructure();
54
55  // Runs several heuristics against the form fields to determine their possible
56  // types.
57  void DetermineHeuristicTypes(const AutofillMetrics& metric_logger);
58
59  // Encodes the XML upload request from this FormStructure.
60  bool EncodeUploadRequest(const ServerFieldTypeSet& available_field_types,
61                           bool form_was_autofilled,
62                           std::string* encoded_xml) const;
63
64  // Encodes a XML block contains autofill field type from this FormStructure.
65  // This XML will be written VLOG only, never be sent to server. It will
66  // help make FieldAssignments and feed back to autofill server as
67  // experiment data.
68  bool EncodeFieldAssignments(const ServerFieldTypeSet& available_field_types,
69                              std::string* encoded_xml) const;
70
71  // Encodes the XML query request for the set of forms.
72  // All fields are returned in one XML. For example, there are three forms,
73  // with 2, 4, and 3 fields. The returned XML would have type info for 9
74  // fields, first two of which would be for the first form, next 4 for the
75  // second, and the rest is for the third.
76  static bool EncodeQueryRequest(const std::vector<FormStructure*>& forms,
77                                 std::vector<std::string>* encoded_signatures,
78                                 std::string* encoded_xml);
79
80  // Parses the field types from the server query response. |forms| must be the
81  // same as the one passed to EncodeQueryRequest when constructing the query.
82  static void ParseQueryResponse(
83      const std::string& response_xml,
84      const std::vector<FormStructure*>& forms,
85      autofill::AutocheckoutPageMetaData* page_meta_data,
86      const AutofillMetrics& metric_logger);
87
88  // Fills |forms| with the details from the given |form_structures| and their
89  // fields' predicted types.
90  static void GetFieldTypePredictions(
91      const std::vector<FormStructure*>& form_structures,
92      std::vector<FormDataPredictions>* forms);
93
94  // The unique signature for this form, composed of the target url domain,
95  // the form name, and the form field names in a 64-bit hash.
96  std::string FormSignature() const;
97
98  // Runs a quick heuristic to rule out forms that are obviously not
99  // auto-fillable, like google/yahoo/msn search, etc. The requirement that the
100  // form's method be POST is only applied if |require_method_post| is true.
101  bool IsAutofillable(bool require_method_post) const;
102
103  // Resets |autofill_count_| and counts the number of auto-fillable fields.
104  // This is used when we receive server data for form fields.  At that time,
105  // we may have more known fields than just the number of fields we matched
106  // heuristically.
107  void UpdateAutofillCount();
108
109  // Returns true if this form matches the structural requirements for Autofill.
110  // The requirement that the form's method be POST is only applied if
111  // |require_method_post| is true.
112  bool ShouldBeParsed(bool require_method_post) const;
113
114  // Returns true if we should query the crowdsourcing server to determine this
115  // form's field types.  If the form includes author-specified types, this will
116  // return false.
117  bool ShouldBeCrowdsourced() const;
118
119  // Sets the field types and experiment id to be those set for |cached_form|.
120  void UpdateFromCache(const FormStructure& cached_form);
121
122  // Logs quality metrics for |this|, which should be a user-submitted form.
123  // This method should only be called after the possible field types have been
124  // set for each field.  |interaction_time| should be a timestamp corresponding
125  // to the user's first interaction with the form.  |submission_time| should be
126  // a timestamp corresponding to the form's submission.
127  void LogQualityMetrics(const AutofillMetrics& metric_logger,
128                         const base::TimeTicks& load_time,
129                         const base::TimeTicks& interaction_time,
130                         const base::TimeTicks& submission_time) const;
131
132  // Classifies each field in |fields_| based upon its |autocomplete| attribute,
133  // if the attribute is available.  The association is stored into the field's
134  // |heuristic_type|.
135  // Fills |found_types| with |true| if the attribute is available and neither
136  // empty nor set to the special values "on" or "off" for at least one field.
137  // Fills |found_sections| with |true| if the attribute specifies a section for
138  // at least one field.
139  void ParseFieldTypesFromAutocompleteAttributes(bool* found_types,
140                                                 bool* found_sections);
141
142  const AutofillField* field(size_t index) const;
143  AutofillField* field(size_t index);
144  size_t field_count() const;
145
146  // Returns the number of fields that are able to be autofilled.
147  size_t autofill_count() const { return autofill_count_; }
148
149  // Used for iterating over the fields.
150  std::vector<AutofillField*>::const_iterator begin() const {
151    return fields_.begin();
152  }
153  std::vector<AutofillField*>::const_iterator end() const {
154    return fields_.end();
155  }
156
157  const GURL& source_url() const { return source_url_; }
158
159  UploadRequired upload_required() const { return upload_required_; }
160
161  virtual std::string server_experiment_id() const;
162
163  // Returns a FormData containing the data this form structure knows about.
164  // |user_submitted| is currently always false.
165  FormData ToFormData() const;
166
167  bool filled_by_autocheckout() const { return filled_by_autocheckout_; }
168  void set_filled_by_autocheckout(bool filled_by_autocheckout) {
169    filled_by_autocheckout_ = filled_by_autocheckout;
170  }
171
172  bool operator==(const FormData& form) const;
173  bool operator!=(const FormData& form) const;
174
175 private:
176  friend class FormStructureTest;
177  FRIEND_TEST_ALL_PREFIXES(AutofillDownloadTest, QueryAndUploadTest);
178
179  // 64-bit hash of the string - used in FormSignature and unit-tests.
180  static std::string Hash64Bit(const std::string& str);
181
182  enum EncodeRequestType {
183    QUERY,
184    UPLOAD,
185    FIELD_ASSIGNMENTS,
186  };
187
188  // Adds form info to |encompassing_xml_element|. |request_type| indicates if
189  // it is a query or upload.
190  bool EncodeFormRequest(EncodeRequestType request_type,
191                         buzz::XmlElement* encompassing_xml_element) const;
192
193  // Classifies each field in |fields_| into a logical section.
194  // Sections are identified by the heuristic that a logical section should not
195  // include multiple fields of the same autofill type (with some exceptions, as
196  // described in the implementation).  Sections are furthermore distinguished
197  // as either credit card or non-credit card sections.
198  // If |has_author_specified_sections| is true, only the second pass --
199  // distinguishing credit card sections from non-credit card ones -- is made.
200  void IdentifySections(bool has_author_specified_sections);
201
202  bool IsAutocheckoutEnabled() const;
203
204  // Returns true if field should be skipped when talking to Autofill server.
205  bool ShouldSkipField(const FormFieldData& field) const;
206
207  // Returns the minimal number of fillable fields required to start autofill.
208  size_t RequiredFillableFields() const;
209  size_t active_field_count() const;
210
211  // The name of the form.
212  base::string16 form_name_;
213
214  // The source URL.
215  GURL source_url_;
216
217  // The target URL.
218  GURL target_url_;
219
220  // The number of fields able to be auto-filled.
221  size_t autofill_count_;
222
223  // A vector of all the input fields in the form.
224  ScopedVector<AutofillField> fields_;
225
226  // The number of fields counted towards form signature and request to Autofill
227  // server.
228  size_t active_field_count_;
229
230  // The names of the form input elements, that are part of the form signature.
231  // The string starts with "&" and the names are also separated by the "&"
232  // character. E.g.: "&form_input1_name&form_input2_name&...&form_inputN_name"
233  std::string form_signature_field_names_;
234
235  // Whether the server expects us to always upload, never upload, or default
236  // to the stored upload rates.
237  UploadRequired upload_required_;
238
239  // The server experiment corresponding to the server types returned for this
240  // form.
241  std::string server_experiment_id_;
242
243  // GET or POST.
244  RequestMethod method_;
245
246  // Whether the form includes any field types explicitly specified by the site
247  // author, via the |autocompletetype| attribute.
248  bool has_author_specified_types_;
249
250  // The URL prefix matched in autocheckout whitelist. An empty string implies
251  // autocheckout is not enabled for this form.
252  std::string autocheckout_url_prefix_;
253
254  // Whether or not this form was filled by Autocheckout.
255  bool filled_by_autocheckout_;
256
257  DISALLOW_COPY_AND_ASSIGN(FormStructure);
258};
259
260}  // namespace autofill
261
262#endif  // COMPONENTS_AUTOFILL_CORE_BROWSER_FORM_STRUCTURE_H_
263