1 /*
2 * Copyright (C) 2009 Google Inc. All rights reserved.
3 *
4 * Redistribution and use in source and binary forms, with or without
5 * modification, are permitted provided that the following conditions are
6 * met:
7 *
8 * * Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above
11 * copyright notice, this list of conditions and the following disclaimer
12 * in the documentation and/or other materials provided with the
13 * distribution.
14 * * Neither the name of Google Inc. nor the names of its
15 * contributors may be used to endorse or promote products derived from
16 * this software without specific prior written permission.
17 *
18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
21 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
22 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
23 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
24 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
28 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 */
30
31 #include "config.h"
32 #include "WebSearchableFormData.h"
33
34 #include "HTMLNames.h"
35 #include "WebFormElement.h"
36 #include "WebInputElement.h"
37 #include "core/dom/Document.h"
38 #include "core/html/FormDataList.h"
39 #include "core/html/HTMLFormControlElement.h"
40 #include "core/html/HTMLFormElement.h"
41 #include "core/html/HTMLInputElement.h"
42 #include "core/html/HTMLOptionElement.h"
43 #include "core/html/HTMLSelectElement.h"
44 #include "core/html/HTMLTextAreaElement.h"
45 #include "platform/network/FormDataBuilder.h"
46 #include "wtf/text/TextEncoding.h"
47
48 using namespace WebCore;
49 using namespace HTMLNames;
50
51 namespace {
52
53 // Gets the encoding for the form.
GetFormEncoding(const HTMLFormElement * form,WTF::TextEncoding * encoding)54 void GetFormEncoding(const HTMLFormElement* form, WTF::TextEncoding* encoding)
55 {
56 String str(form->getAttribute(HTMLNames::accept_charsetAttr));
57 str.replace(',', ' ');
58 Vector<String> charsets;
59 str.split(' ', charsets);
60 for (Vector<String>::const_iterator i(charsets.begin()); i != charsets.end(); ++i) {
61 *encoding = WTF::TextEncoding(*i);
62 if (encoding->isValid())
63 return;
64 }
65 if (!form->document().loader())
66 return;
67 *encoding = WTF::TextEncoding(form->document().encoding());
68 }
69
70 // Returns true if the submit request results in an HTTP URL.
IsHTTPFormSubmit(const HTMLFormElement * form)71 bool IsHTTPFormSubmit(const HTMLFormElement* form)
72 {
73 // FIXME: This function is insane. This is an overly complicated way to get this information.
74 String action(form->action());
75 // The isNull() check is trying to avoid completeURL returning KURL() when passed a null string.
76 return form->document().completeURL(action.isNull() ? "" : action).protocolIs("http");
77 }
78
79 // If the form does not have an activated submit button, the first submit
80 // button is returned.
GetButtonToActivate(HTMLFormElement * form)81 HTMLFormControlElement* GetButtonToActivate(HTMLFormElement* form)
82 {
83 HTMLFormControlElement* firstSubmitButton = 0;
84 const Vector<FormAssociatedElement*>& element = form->associatedElements();
85 for (Vector<FormAssociatedElement*>::const_iterator i(element.begin()); i != element.end(); ++i) {
86 if (!(*i)->isFormControlElement())
87 continue;
88 HTMLFormControlElement* control = toHTMLFormControlElement(*i);
89 if (control->isActivatedSubmit()) {
90 // There's a button that is already activated for submit, return 0.
91 return 0;
92 }
93 if (!firstSubmitButton && control->isSuccessfulSubmitButton())
94 firstSubmitButton = control;
95 }
96 return firstSubmitButton;
97 }
98
99 // Returns true if the selected state of all the options matches the default
100 // selected state.
IsSelectInDefaultState(HTMLSelectElement * select)101 bool IsSelectInDefaultState(HTMLSelectElement* select)
102 {
103 const Vector<HTMLElement*>& listItems = select->listItems();
104 if (select->multiple() || select->size() > 1) {
105 for (Vector<HTMLElement*>::const_iterator i(listItems.begin()); i != listItems.end(); ++i) {
106 if (!(*i)->hasLocalName(HTMLNames::optionTag))
107 continue;
108 HTMLOptionElement* optionElement = toHTMLOptionElement(*i);
109 if (optionElement->selected() != optionElement->hasAttribute(selectedAttr))
110 return false;
111 }
112 return true;
113 }
114
115 // The select is rendered as a combobox (called menulist in WebKit). At
116 // least one item is selected, determine which one.
117 HTMLOptionElement* initialSelected = 0;
118 for (Vector<HTMLElement*>::const_iterator i(listItems.begin()); i != listItems.end(); ++i) {
119 if (!(*i)->hasLocalName(HTMLNames::optionTag))
120 continue;
121 HTMLOptionElement* optionElement = toHTMLOptionElement(*i);
122 if (optionElement->hasAttribute(selectedAttr)) {
123 // The page specified the option to select.
124 initialSelected = optionElement;
125 break;
126 }
127 if (!initialSelected)
128 initialSelected = optionElement;
129 }
130 return !initialSelected || initialSelected->selected();
131 }
132
133 // Returns true if the form element is in its default state, false otherwise.
134 // The default state is the state of the form element on initial load of the
135 // page, and varies depending upon the form element. For example, a checkbox is
136 // in its default state if the checked state matches the state of the checked attribute.
IsInDefaultState(HTMLFormControlElement * formElement)137 bool IsInDefaultState(HTMLFormControlElement* formElement)
138 {
139 if (formElement->hasTagName(HTMLNames::inputTag)) {
140 const HTMLInputElement* inputElement = toHTMLInputElement(formElement);
141 if (inputElement->isCheckbox() || inputElement->isRadioButton())
142 return inputElement->checked() == inputElement->hasAttribute(checkedAttr);
143 } else if (formElement->hasTagName(HTMLNames::selectTag)) {
144 return IsSelectInDefaultState(toHTMLSelectElement(formElement));
145 }
146 return true;
147 }
148
149 // Look for a suitable search text field in a given HTMLFormElement
150 // Return nothing if one of those items are found:
151 // - A text area field
152 // - A file upload field
153 // - A Password field
154 // - More than one text field
findSuitableSearchInputElement(const HTMLFormElement * form)155 HTMLInputElement* findSuitableSearchInputElement(const HTMLFormElement* form)
156 {
157 HTMLInputElement* textElement = 0;
158 const Vector<FormAssociatedElement*>& element = form->associatedElements();
159 for (Vector<FormAssociatedElement*>::const_iterator i(element.begin()); i != element.end(); ++i) {
160 if (!(*i)->isFormControlElement())
161 continue;
162
163 HTMLFormControlElement* control = toHTMLFormControlElement(*i);
164
165 if (control->isDisabledFormControl() || control->name().isNull())
166 continue;
167
168 if (!IsInDefaultState(control) || isHTMLTextAreaElement(control))
169 return 0;
170
171 if (control->hasTagName(HTMLNames::inputTag) && control->willValidate()) {
172 const HTMLInputElement* input = toHTMLInputElement(control);
173
174 // Return nothing if a file upload field or a password field are found.
175 if (input->isFileUpload() || input->isPasswordField())
176 return 0;
177
178 if (input->isTextField()) {
179 if (textElement) {
180 // The auto-complete bar only knows how to fill in one value.
181 // This form has multiple fields; don't treat it as searchable.
182 return 0;
183 }
184 textElement = toHTMLInputElement(control);
185 }
186 }
187 }
188 return textElement;
189 }
190
191 // Build a search string based on a given HTMLFormElement and HTMLInputElement
192 //
193 // Search string output example from www.google.com:
194 // "hl=en&source=hp&biw=1085&bih=854&q={searchTerms}&btnG=Google+Search&aq=f&aqi=&aql=&oq="
195 //
196 // Return false if the provided HTMLInputElement is not found in the form
buildSearchString(const HTMLFormElement * form,Vector<char> * encodedString,WTF::TextEncoding * encoding,const HTMLInputElement * textElement)197 bool buildSearchString(const HTMLFormElement* form, Vector<char>* encodedString, WTF::TextEncoding* encoding, const HTMLInputElement* textElement)
198 {
199 bool isElementFound = false;
200
201 Vector<FormAssociatedElement*> elements = form->associatedElements();
202 for (Vector<FormAssociatedElement*>::const_iterator i(elements.begin()); i != elements.end(); ++i) {
203 if (!(*i)->isFormControlElement())
204 continue;
205
206 HTMLFormControlElement* control = toHTMLFormControlElement(*i);
207
208 if (control->isDisabledFormControl() || control->name().isNull())
209 continue;
210
211 FormDataList dataList(*encoding);
212 if (!control->appendFormData(dataList, false))
213 continue;
214
215 const Vector<FormDataList::Item>& items = dataList.items();
216
217 for (Vector<FormDataList::Item>::const_iterator j(items.begin()); j != items.end(); ++j) {
218 // Handle ISINDEX / <input name=isindex> specially, but only if it's
219 // the first entry.
220 if (!encodedString->isEmpty() || j->data() != "isindex") {
221 if (!encodedString->isEmpty())
222 encodedString->append('&');
223 FormDataBuilder::encodeStringAsFormData(*encodedString, j->data());
224 encodedString->append('=');
225 }
226 ++j;
227 if (control == textElement) {
228 encodedString->append("{searchTerms}", 13);
229 isElementFound = true;
230 } else
231 FormDataBuilder::encodeStringAsFormData(*encodedString, j->data());
232 }
233 }
234 return isElementFound;
235 }
236 } // namespace
237
238 namespace blink {
239
WebSearchableFormData(const WebFormElement & form,const WebInputElement & selectedInputElement)240 WebSearchableFormData::WebSearchableFormData(const WebFormElement& form, const WebInputElement& selectedInputElement)
241 {
242 RefPtr<HTMLFormElement> formElement = form.operator PassRefPtr<HTMLFormElement>();
243 HTMLInputElement* inputElement = selectedInputElement.operator PassRefPtr<HTMLInputElement>().get();
244
245 // Only consider forms that GET data.
246 // Allow HTTPS only when an input element is provided.
247 if (equalIgnoringCase(formElement->getAttribute(methodAttr), "post")
248 || (!IsHTTPFormSubmit(formElement.get()) && !inputElement))
249 return;
250
251 Vector<char> encodedString;
252 WTF::TextEncoding encoding;
253
254 GetFormEncoding(formElement.get(), &encoding);
255 if (!encoding.isValid()) {
256 // Need a valid encoding to encode the form elements.
257 // If the encoding isn't found webkit ends up replacing the params with
258 // empty strings. So, we don't try to do anything here.
259 return;
260 }
261
262 // Look for a suitable search text field in the form when a
263 // selectedInputElement is not provided.
264 if (!inputElement) {
265 inputElement = findSuitableSearchInputElement(formElement.get());
266
267 // Return if no suitable text element has been found.
268 if (!inputElement)
269 return;
270 }
271
272 HTMLFormControlElement* firstSubmitButton = GetButtonToActivate(formElement.get());
273 if (firstSubmitButton) {
274 // The form does not have an active submit button, make the first button
275 // active. We need to do this, otherwise the URL will not contain the
276 // name of the submit button.
277 firstSubmitButton->setActivatedSubmit(true);
278 }
279
280 bool isValidSearchString = buildSearchString(formElement.get(), &encodedString, &encoding, inputElement);
281
282 if (firstSubmitButton)
283 firstSubmitButton->setActivatedSubmit(false);
284
285 // Return if the search string is not valid.
286 if (!isValidSearchString)
287 return;
288
289 String action(formElement->action());
290 KURL url(formElement->document().completeURL(action.isNull() ? "" : action));
291 RefPtr<FormData> formData = FormData::create(encodedString);
292 url.setQuery(formData->flattenToString());
293 m_url = url;
294 m_encoding = String(encoding.name());
295 }
296
297 } // namespace blink
298