1 // Copyright 2014 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
5 #include "components/search_engines/template_url.h"
10 #include "base/basictypes.h"
11 #include "base/command_line.h"
12 #include "base/format_macros.h"
13 #include "base/i18n/icu_string_conversions.h"
14 #include "base/i18n/rtl.h"
15 #include "base/logging.h"
16 #include "base/metrics/field_trial.h"
17 #include "base/rand_util.h"
18 #include "base/strings/string_number_conversions.h"
19 #include "base/strings/string_piece.h"
20 #include "base/strings/string_split.h"
21 #include "base/strings/string_util.h"
22 #include "base/strings/stringprintf.h"
23 #include "base/strings/utf_string_conversions.h"
24 #include "components/google/core/browser/google_util.h"
25 #include "components/metrics/proto/omnibox_input_type.pb.h"
26 #include "components/search_engines/search_engines_switches.h"
27 #include "components/search_engines/search_terms_data.h"
28 #include "components/url_formatter/url_formatter.h"
29 #include "google_apis/google_api_keys.h"
30 #include "net/base/escape.h"
31 #include "net/base/mime_util.h"
32 #include "net/base/net_util.h"
33 #include "ui/base/device_form_factor.h"
38 // The TemplateURLRef has any number of terms that need to be replaced. Each of
39 // the terms is enclosed in braces. If the character preceding the final
40 // brace is a ?, it indicates the term is optional and can be replaced with
// NOTE(review): the sentence above is cut off in this listing (the embedded
// numbering skips a line); confirm its ending against the upstream file.
//
// Opening delimiter, closing delimiter, and optional-term marker of a
// replaceable term.
42 const char kStartParameter
= '{';
43 const char kEndParameter
= '}';
44 const char kOptional
= '?';
46 // Known parameters found in the URL.
// Bare name, brace-enclosed form, and percent-escaped brace-enclosed form of
// the search terms parameter.
47 const char kSearchTermsParameter
[] = "searchTerms";
48 const char kSearchTermsParameterFull
[] = "{searchTerms}";
49 const char kSearchTermsParameterFullEscaped
[] = "%7BsearchTerms%7D";
51 // Same as kSearchTermsParameter, with no escaping.
52 const char kGoogleUnescapedSearchTermsParameter
[] =
53 "google:unescapedSearchTerms";
54 const char kGoogleUnescapedSearchTermsParameterFull
[] =
55 "{google:unescapedSearchTerms}";
57 // Display value for kSearchTermsParameter.
58 const char kDisplaySearchTerms
[] = "%s";
60 // Display value for kGoogleUnescapedSearchTermsParameter.
61 const char kDisplayUnescapedSearchTerms
[] = "%S";
63 // Used if the count parameter is not optional. Indicates we want 10 search
// NOTE(review): the comment above is cut off in this listing; presumably it
// ends with "results" -- confirm against the upstream file.
65 const char kDefaultCount
[] = "10";
67 // Used if the output encoding parameter is required.
68 const char kOutputEncodingType
[] = "UTF-8";
70 // Attempts to encode |terms| and |original_query| in |encoding| and escape
71 // them. |terms| may be escaped as path or query depending on |is_in_query|;
72 // |original_query| is always escaped as query. Returns whether the encoding
// NOTE(review): the comment above is cut off. The declarations of |encoding|
// and |is_in_query| (both used below) and the statements guarded by each `if`
// are not present in this listing (the embedded numbering skips them) --
// confirm against the upstream file.
//
// Both output pointers are DCHECKed to be non-null. The escaped results are
// written as UTF-16 strings via base::UTF8ToUTF16().
74 bool TryEncoding(const base::string16
& terms
,
75 const base::string16
& original_query
,
78 base::string16
* escaped_terms
,
79 base::string16
* escaped_original_query
) {
80 DCHECK(escaped_terms
);
81 DCHECK(escaped_original_query
);
// Convert |terms| to |encoding| using the SKIP conversion-error policy.
82 std::string encoded_terms
;
83 if (!base::UTF16ToCodepage(terms
, encoding
,
84 base::OnStringConversionError::SKIP
, &encoded_terms
))
86 *escaped_terms
= base::UTF8ToUTF16(is_in_query
?
87 net::EscapeQueryParamValue(encoded_terms
, true) :
88 net::EscapePath(encoded_terms
));
89 if (original_query
.empty())
// |original_query| goes through the same conversion but is always escaped
// with EscapeQueryParamValue().
91 std::string encoded_original_query
;
92 if (!base::UTF16ToCodepage(original_query
, encoding
,
93 base::OnStringConversionError::SKIP
, &encoded_original_query
))
95 *escaped_original_query
= base::UTF8ToUTF16(
96 net::EscapeQueryParamValue(encoded_original_query
, true));
100 // Extract query key and host given a list of parameters coming from the URL
// NOTE(review): the comment above is cut off in this listing.
//
// Walks the key/value pairs of |params| with url::ExtractQueryKeyValue() and
// returns the key of the first pair whose non-empty value contains either
// kSearchTermsParameterFull or kGoogleUnescapedSearchTermsParameterFull.
// Returns an empty string when no such pair is found.
// NOTE(review): the condition guarding the first early return, the second
// argument of |value_string|, and the closing braces are missing from this
// listing -- confirm against the upstream file.
102 std::string
FindSearchTermsKey(const std::string
& params
) {
104 return std::string();
105 url::Component query
, key
, value
;
// |query| is sized to cover the whole of |params|.
106 query
.len
= static_cast<int>(params
.size());
107 while (url::ExtractQueryKeyValue(params
.c_str(), &query
, &key
, &value
)) {
108 if (key
.is_nonempty() && value
.is_nonempty()) {
109 const base::StringPiece
value_string(params
.c_str() + value
.begin
,
111 if (value_string
.find(kSearchTermsParameterFull
, 0) !=
112 base::StringPiece::npos
||
113 value_string
.find(kGoogleUnescapedSearchTermsParameterFull
, 0) !=
114 base::StringPiece::npos
) {
115 return params
.substr(key
.begin
, key
.len
);
119 return std::string();
122 // Extract the position of the search terms' parameter in the URL path.
// Resets |parameter_position| (which must be non-null), then searches |path|
// for kSearchTermsParameterFullEscaped. On a match, |parameter_position|
// receives the match offset and the length of the escaped parameter (array
// size minus the terminating NUL).
// NOTE(review): the return statements and closing brace are missing from this
// listing; presumably false is returned when nothing is found and true
// otherwise -- confirm against the upstream file.
123 bool FindSearchTermsInPath(const std::string
& path
,
124 url::Component
* parameter_position
) {
125 DCHECK(parameter_position
);
126 parameter_position
->reset();
127 const size_t begin
= path
.find(kSearchTermsParameterFullEscaped
);
128 if (begin
== std::string::npos
)
130 parameter_position
->begin
= begin
;
131 parameter_position
->len
= arraysize(kSearchTermsParameterFullEscaped
) - 1;
// Returns true when |param| is longer than two characters, starts with
// kStartParameter and ends with kEndParameter.
// NOTE(review): the closing brace is missing from this listing.
135 bool IsTemplateParameterString(const std::string
& param
) {
136 return (param
.length() > 2) && (*(param
.begin()) == kStartParameter
) &&
137 (*(param
.rbegin()) == kEndParameter
);
143 // TemplateURLRef::SearchTermsArgs --------------------------------------------
// Builds the argument bundle for |search_terms|. Every other member in the
// initializer list gets a fixed default: INVALID input type,
// NO_SUGGESTIONS_AVAILABLE, npos cursor position, INVALID_SPEC page
// classification, all boolean flags false, and default-constructed contextual
// search params.
// NOTE(review): the closing brace is missing from this listing.
145 TemplateURLRef::SearchTermsArgs::SearchTermsArgs(
146 const base::string16
& search_terms
)
147 : search_terms(search_terms
),
148 input_type(metrics::OmniboxInputType::INVALID
),
149 accepted_suggestion(NO_SUGGESTIONS_AVAILABLE
),
150 cursor_position(base::string16::npos
),
151 enable_omnibox_start_margin(false),
152 page_classification(metrics::OmniboxEventProto::INVALID_SPEC
),
153 bookmark_bar_pinned(false),
154 append_extra_query_params(false),
155 force_instant_results(false),
156 from_app_list(false),
157 contextual_search_params(ContextualSearchParams()) {
// Destructor. No statements are visible in this listing (the closing brace is
// missing).
160 TemplateURLRef::SearchTermsArgs::~SearchTermsArgs() {
// Default constructor: sets |start| and |end| to base::string16::npos.
// NOTE(review): the first and last initializers and the body are missing from
// this listing -- confirm against the upstream file.
163 TemplateURLRef::SearchTermsArgs::ContextualSearchParams::
164 ContextualSearchParams()
166 start(base::string16::npos
),
167 end(base::string16::npos
),
// Constructor taking (at least) |selection| and |base_page_url|, which are
// copied into the members of the same name; |start| and |end| are set to
// base::string16::npos.
// NOTE(review): some parameters, initializers and the body are missing from
// this listing -- confirm against the upstream file.
171 TemplateURLRef::SearchTermsArgs::ContextualSearchParams::
172 ContextualSearchParams(
174 const std::string
& selection
,
175 const std::string
& base_page_url
,
178 start(base::string16::npos
),
179 end(base::string16::npos
),
180 selection(selection
),
181 base_page_url(base_page_url
),
// Constructor taking (at least) |selection|, |content|, |base_page_url| and
// |encoding|. The visible initializers copy |selection| and |base_page_url|
// into the members of the same name.
// NOTE(review): the remaining parameters, initializers and the body are
// missing from this listing -- confirm against the upstream file.
185 TemplateURLRef::SearchTermsArgs::ContextualSearchParams::
186 ContextualSearchParams(
190 const std::string
& selection
,
191 const std::string
& content
,
192 const std::string
& base_page_url
,
193 const std::string
& encoding
,
198 selection(selection
),
200 base_page_url(base_page_url
),
// Destructor. No statements are visible in this listing (the closing brace is
// missing).
205 TemplateURLRef::SearchTermsArgs::ContextualSearchParams::
206 ~ContextualSearchParams() {
209 // TemplateURLRef -------------------------------------------------------------
// Constructs a ref for |owner| of the given |type|. The visible initializers
// start with replacements unsupported, no search-term position in the path,
// the search-term key location set to QUERY, and prepopulated_ false.
// The type must not be INDEXED (DCHECKed).
// NOTE(review): the leading initializers and parts of the body are missing
// from this listing -- confirm against the upstream file.
211 TemplateURLRef::TemplateURLRef(const TemplateURL
* owner
, Type type
)
217 supports_replacements_(false),
218 search_term_position_in_path_(std::string::npos
),
219 search_term_key_location_(url::Parsed::QUERY
),
220 prepopulated_(false) {
222 DCHECK_NE(INDEXED
, type_
);
// Constructs a ref that addresses the URL at |index_in_owner| within |owner|.
// The visible initializers store the index and otherwise use the same starting
// state as the other constructor. The index must be smaller than
// owner_->URLCount() (DCHECKed).
// NOTE(review): the leading initializers and parts of the body are missing
// from this listing -- confirm against the upstream file.
225 TemplateURLRef::TemplateURLRef(const TemplateURL
* owner
, size_t index_in_owner
)
228 index_in_owner_(index_in_owner
),
231 supports_replacements_(false),
232 search_term_position_in_path_(std::string::npos
),
233 search_term_key_location_(url::Parsed::QUERY
),
234 prepopulated_(false) {
236 DCHECK_LT(index_in_owner_
, owner_
->URLCount());
// Destructor. No statements are visible in this listing (the closing brace is
// missing).
239 TemplateURLRef::~TemplateURLRef() {
// Returns the URL string held by |owner_| that corresponds to this ref's
// type. INDEXED refs use owner_->GetURL(index_in_owner_). An unexpected type
// hits NOTREACHED() and yields an empty string.
// NOTE(review): the switch header (presumably on type_) and the closing braces
// are missing from this listing.
242 std::string
TemplateURLRef::GetURL() const {
244 case SEARCH
: return owner_
->url();
245 case SUGGEST
: return owner_
->suggestions_url();
246 case INSTANT
: return owner_
->instant_url();
247 case IMAGE
: return owner_
->image_url();
248 case NEW_TAB
: return owner_
->new_tab_url();
249 case CONTEXTUAL_SEARCH
: return owner_
->contextual_search_url();
250 case INDEXED
: return owner_
->GetURL(index_in_owner_
);
251 default: NOTREACHED(); return std::string(); // NOLINT
// Returns the POST-parameter string held by |owner_| for this ref's type.
// NEW_TAB and CONTEXTUAL_SEARCH always yield an empty string. An unexpected
// type hits NOTREACHED() and yields an empty string.
// NOTE(review): the switch header and closing braces are missing from this
// listing; no INDEXED case is visible.
255 std::string
TemplateURLRef::GetPostParamsString() const {
258 case SEARCH
: return owner_
->search_url_post_params();
259 case SUGGEST
: return owner_
->suggestions_url_post_params();
260 case INSTANT
: return owner_
->instant_url_post_params();
261 case NEW_TAB
: return std::string();
262 case CONTEXTUAL_SEARCH
: return std::string();
263 case IMAGE
: return owner_
->image_url_post_params();
264 default: NOTREACHED(); return std::string(); // NOLINT
// Runs ParseIfNecessary() and then reports whether any POST parameters were
// collected (post_params_ is non-empty).
268 bool TemplateURLRef::UsesPOSTMethod(
269 const SearchTermsData
& search_terms_data
) const {
270 ParseIfNecessary(search_terms_data
);
271 return !post_params_
.empty();
// Encodes |post_params| as a multipart/form-data body into |post_content|:
// |post_content->first| receives the MIME type including the boundary and
// |post_content->second| receives the encoded parts followed by the final
// delimiter.
// NOTE(review): the statement guarded by the empty() check, the argument that
// fills the "%016" PRIx64 boundary placeholder, and the return statements are
// missing from this listing -- confirm against the upstream file.
274 bool TemplateURLRef::EncodeFormData(const PostParams
& post_params
,
275 PostContent
* post_content
) const {
276 if (post_params
.empty())
281 const char kUploadDataMIMEType
[] = "multipart/form-data; boundary=";
282 const char kMultipartBoundary
[] = "----+*+----%016" PRIx64
"----+*+----";
283 // Each name/value pair is stored in a body part which is preceded by a
284 // boundary delimiter line. Uses random number generator here to create
285 // a unique boundary delimiter for form data encoding.
286 std::string boundary
= base::StringPrintf(kMultipartBoundary
,
288 // Sets the content MIME type.
289 post_content
->first
= kUploadDataMIMEType
;
290 post_content
->first
+= boundary
;
291 // Encodes the post parameters.
292 std::string
* post_data
= &post_content
->second
;
// One multipart body part per parameter; every parameter needs a name.
294 for (const auto& param
: post_params
) {
295 DCHECK(!param
.name
.empty());
296 net::AddMultipartValueForUpload(param
.name
, param
.value
, boundary
,
297 param
.content_type
, post_data
);
299 net::AddMultipartFinalDelimiterForUpload(boundary
, post_data
);
// Runs ParseIfNecessary() and returns true only when the parsed URL is valid
// and supports replacements (valid_ && supports_replacements_).
303 bool TemplateURLRef::SupportsReplacement(
304 const SearchTermsData
& search_terms_data
) const {
305 ParseIfNecessary(search_terms_data
);
306 return valid_
&& supports_replacements_
;
// Produces the URL spec for |search_terms_args|: runs HandleReplacements() on
// the parsed template and then prepends extra query parameters to the
// resulting URL's query.
//
// Query parameters are collected in this order and joined with "&":
//   1. the kExtraSearchQueryParams command-line switch value, when
//      |append_extra_query_params| is set and the value is non-empty;
//   2. |suggest_query_params|, when non-empty;
//   3. the query already present on the generated URL, when non-empty.
//
// NOTE(review): several lines are missing from this listing, including the
// condition before the first early return, the declaration of |gurl|, and the
// statements taken when the URL is invalid or no parameters were collected --
// confirm against the upstream file.
309 std::string
TemplateURLRef::ReplaceSearchTerms(
310 const SearchTermsArgs
& search_terms_args
,
311 const SearchTermsData
& search_terms_data
,
312 PostContent
* post_content
) const {
313 ParseIfNecessary(search_terms_data
);
315 return std::string();
317 std::string
url(HandleReplacements(search_terms_args
, search_terms_data
,
321 if (!gurl
.is_valid())
324 std::vector
<std::string
> query_params
;
325 if (search_terms_args
.append_extra_query_params
) {
326 std::string
extra_params(
327 base::CommandLine::ForCurrentProcess()->GetSwitchValueASCII(
328 switches::kExtraSearchQueryParams
));
329 if (!extra_params
.empty())
330 query_params
.push_back(extra_params
);
332 if (!search_terms_args
.suggest_query_params
.empty())
333 query_params
.push_back(search_terms_args
.suggest_query_params
);
334 if (!gurl
.query().empty())
335 query_params
.push_back(gurl
.query());
337 if (query_params
.empty())
// Replace the whole query component with the joined parameter list.
340 GURL::Replacements replacements
;
341 std::string query_str
= base::JoinString(query_params
, "&");
342 replacements
.SetQueryStr(query_str
);
343 return gurl
.ReplaceComponents(replacements
).possibly_invalid_spec();
// Runs ParseIfNecessary() before reporting validity.
// NOTE(review): the return statement is missing from this listing; presumably
// it returns valid_ -- confirm against the upstream file.
346 bool TemplateURLRef::IsValid(const SearchTermsData
& search_terms_data
) const {
347 ParseIfNecessary(search_terms_data
);
// Returns the template URL in display form as UTF-16. When the ref is valid
// and has replacements, every "{searchTerms}" becomes kDisplaySearchTerms
// ("%s") and every "{google:unescapedSearchTerms}" becomes
// kDisplayUnescapedSearchTerms ("%S"). Otherwise GetURL() is returned
// unchanged.
351 base::string16
TemplateURLRef::DisplayURL(
352 const SearchTermsData
& search_terms_data
) const {
353 ParseIfNecessary(search_terms_data
);
354 std::string
result(GetURL());
355 if (valid_
&& !replacements_
.empty()) {
356 base::ReplaceSubstringsAfterOffset(&result
, 0,
357 kSearchTermsParameterFull
,
358 kDisplaySearchTerms
);
359 base::ReplaceSubstringsAfterOffset(&result
, 0,
360 kGoogleUnescapedSearchTermsParameterFull
,
361 kDisplayUnescapedSearchTerms
);
363 return base::UTF8ToUTF16(result
);
// Converts a display-form URL back to template form by substituting the
// full template parameters for their display values. This is the inverse
// direction of DisplayURL().
// NOTE(review): the search argument of the first replacement (presumably
// kDisplaySearchTerms) and the return statement are missing from this listing
// -- confirm against the upstream file.
367 std::string
TemplateURLRef::DisplayURLToURLRef(
368 const base::string16
& display_url
) {
369 std::string result
= base::UTF16ToUTF8(display_url
);
370 base::ReplaceSubstringsAfterOffset(&result
, 0,
372 kSearchTermsParameterFull
);
373 base::ReplaceSubstringsAfterOffset(&result
, 0,
374 kDisplayUnescapedSearchTerms
,
375 kGoogleUnescapedSearchTermsParameterFull
);
// Runs ParseIfNecessary() before returning a host string by const reference.
// NOTE(review): the return statement is missing from this listing; presumably
// it returns host_ -- confirm against the upstream file.
379 const std::string
& TemplateURLRef::GetHost(
380 const SearchTermsData
& search_terms_data
) const {
381 ParseIfNecessary(search_terms_data
);
// Runs ParseIfNecessary() before returning a path string by const reference.
// NOTE(review): the return statement is missing from this listing; presumably
// it returns path_ -- confirm against the upstream file.
385 const std::string
& TemplateURLRef::GetPath(
386 const SearchTermsData
& search_terms_data
) const {
387 ParseIfNecessary(search_terms_data
);
// Runs ParseIfNecessary() and returns the cached search_term_key_.
391 const std::string
& TemplateURLRef::GetSearchTermKey(
392 const SearchTermsData
& search_terms_data
) const {
393 ParseIfNecessary(search_terms_data
);
394 return search_term_key_
;
// Runs ParseIfNecessary() and returns the cached
// search_term_position_in_path_. Elsewhere in this file that member is reset
// to std::string::npos when no position is known.
397 size_t TemplateURLRef::GetSearchTermPositionInPath(
398 const SearchTermsData
& search_terms_data
) const {
399 ParseIfNecessary(search_terms_data
);
400 return search_term_position_in_path_
;
// Runs ParseIfNecessary() and returns the cached search_term_key_location_.
403 url::Parsed::ComponentType
TemplateURLRef::GetSearchTermKeyLocation(
404 const SearchTermsData
& search_terms_data
) const {
405 ParseIfNecessary(search_terms_data
);
406 return search_term_key_location_
;
// Converts an escaped search |term| taken from a URL into UTF-16.
//
// The term is unescaped first (spaces and URL-special characters; '+' is also
// turned into a space unless the search term lives in the path). The result
// is decoded with each of the owner's input encodings in order, then with
// UTF-8. If nothing decodes, the original escaped |term| is converted
// as-is, with '+' replaced by ' ' when that rule applies.
// NOTE(review): the statements guarded by the CodepageToUTF16() checks and the
// final return are missing from this listing; presumably each successful
// conversion returns |result| -- confirm against the upstream file.
409 base::string16
TemplateURLRef::SearchTermToString16(
410 const std::string
& term
) const {
411 const std::vector
<std::string
>& encodings
= owner_
->input_encodings();
412 base::string16 result
;
414 net::UnescapeRule::Type unescape_rules
=
415 net::UnescapeRule::SPACES
| net::UnescapeRule::URL_SPECIAL_CHARS
;
416 if (search_term_key_location_
!= url::Parsed::PATH
)
417 unescape_rules
|= net::UnescapeRule::REPLACE_PLUS_WITH_SPACE
;
419 std::string unescaped
= net::UnescapeURLComponent(term
, unescape_rules
);
420 for (size_t i
= 0; i
< encodings
.size(); ++i
) {
421 if (base::CodepageToUTF16(unescaped
, encodings
[i
].c_str(),
422 base::OnStringConversionError::FAIL
, &result
))
426 // Always fall back on UTF-8 if it works.
427 if (base::CodepageToUTF16(unescaped
, base::kCodepageUTF8
,
428 base::OnStringConversionError::FAIL
, &result
))
431 // When nothing worked, just use the escaped text. We have no idea what the
432 // encoding is. We need to substitute spaces for pluses ourselves since we're
433 // not sending it through an unescaper.
434 result
= base::UTF8ToUTF16(term
);
435 if (unescape_rules
& net::UnescapeRule::REPLACE_PLUS_WITH_SPACE
)
436 std::replace(result
.begin(), result
.end(), '+', ' ');
// Runs ParseIfNecessary() and scans replacements_ for an entry of type
// GOOGLE_BASE_URL or GOOGLE_BASE_SUGGEST_URL.
// NOTE(review): the return statements are missing from this listing;
// presumably true is returned on the first match and false otherwise --
// confirm against the upstream file.
440 bool TemplateURLRef::HasGoogleBaseURLs(
441 const SearchTermsData
& search_terms_data
) const {
442 ParseIfNecessary(search_terms_data
);
443 for (size_t i
= 0; i
< replacements_
.size(); ++i
) {
444 if ((replacements_
[i
].type
== GOOGLE_BASE_URL
) ||
445 (replacements_
[i
].type
== GOOGLE_BASE_SUGGEST_URL
))
// Tries to recover the search terms from |url| by matching it against this
// template.
//
// |search_terms| must be non-null and is cleared up front. On the visible
// success path it receives the decoded terms (via SearchTermToString16()),
// and the optional out-parameters |search_terms_component| and
// |search_terms_position| receive the component the terms were found in and
// their position within it.
//
// Visible matching steps:
//   - the template must have a search term key, or have its terms in the path;
//   - port and host must match, and so must the path unless the terms live in
//     the path;
//   - for path terms, the text around the term position must match;
//   - for query/ref terms, the key/value pairs are scanned for
//     search_term_key_.
//
// NOTE(review): many lines are missing from this listing, including the
// declaration of the |url| parameter and of |source|, all failure returns, the
// right-hand side of the path comparison, the duplicate-key handling and the
// final return -- confirm against the upstream file.
451 bool TemplateURLRef::ExtractSearchTermsFromURL(
453 base::string16
* search_terms
,
454 const SearchTermsData
& search_terms_data
,
455 url::Parsed::ComponentType
* search_terms_component
,
456 url::Component
* search_terms_position
) const {
457 DCHECK(search_terms
);
458 search_terms
->clear();
460 ParseIfNecessary(search_terms_data
);
462 // We need a search term in the template URL to extract something.
463 if (search_term_key_
.empty() &&
464 (search_term_key_location_
!= url::Parsed::PATH
))
467 // Fill-in the replacements. We don't care about search terms in the pattern,
468 // so we use the empty string.
469 // Currently we assume the search term only shows in URL, not in post params.
470 GURL
pattern(ReplaceSearchTerms(SearchTermsArgs(base::string16()),
471 search_terms_data
, NULL
));
472 // Host, path and port must match.
473 if ((url
.port() != pattern
.port()) ||
474 (url
.host() != host_
) ||
475 ((url
.path() != path_
) &&
476 (search_term_key_location_
!= url::Parsed::PATH
))) {
481 url::Component position
;
483 if (search_term_key_location_
== url::Parsed::PATH
) {
486 // Characters in the path before and after search terms must match.
487 if (source
.length() < path_
.length())
// The term occupies whatever |source| has beyond the length of path_.
489 position
.begin
= search_term_position_in_path_
;
490 position
.len
= source
.length() - path_
.length();
491 if (source
.substr(0, position
.begin
) + source
.substr(position
.end()) !=
495 DCHECK(search_term_key_location_
== url::Parsed::QUERY
||
496 search_term_key_location_
== url::Parsed::REF
);
497 source
= (search_term_key_location_
== url::Parsed::QUERY
) ?
498 url
.query() : url
.ref();
500 url::Component query
, key
, value
;
501 query
.len
= static_cast<int>(source
.size());
502 bool key_found
= false;
503 while (url::ExtractQueryKeyValue(source
.c_str(), &query
, &key
, &value
)) {
504 if (key
.is_nonempty()) {
505 if (source
.substr(key
.begin
, key
.len
) == search_term_key_
) {
506 // Fail if search term key is found twice.
518 // Extract the search term.
519 *search_terms
= SearchTermToString16(
520 source
.substr(position
.begin
, position
.len
));
521 if (search_terms_component
)
522 *search_terms_component
= search_term_key_location_
;
523 if (search_terms_position
)
524 *search_terms_position
= position
;
// Resets the parse results cached on this ref: clears the
// supports_replacements_/valid_/parsed_ flags, the search term key, its
// position and location (back to npos / QUERY), the replacement list and the
// POST parameters. The method is const, so these members are presumably
// declared mutable.
// NOTE(review): the embedded numbering skips two lines here; further members
// may be reset upstream.
528 void TemplateURLRef::InvalidateCachedValues() const {
529 supports_replacements_
= valid_
= parsed_
= false;
532 search_term_key_
.clear();
533 search_term_position_in_path_
= std::string::npos
;
534 search_term_key_location_
= url::Parsed::QUERY
;
535 replacements_
.clear();
536 post_params_
.clear();
// Parses the single "{...}" term of |*url| whose braces sit at |start| and
// |end| (both valid positions with end > start, DCHECKed).
//
// The whole term is erased from |*url|. Depending on its name, one of the
// following then happens:
//   - a Replacement(<type>, start) is appended to |replacements| for values
//     that are filled in later (search terms, the google:* parameters,
//     inputEncoding, language, ...);
//   - a constant is inserted back at |start| for values known now (e.g.
//     kDefaultCount for "count", kOutputEncodingType for "outputEncoding",
//     "1" for startIndex/startPage, the source id, the yandex search path);
//   - an unknown term is re-inserted verbatim when this ref is not
//     prepopulated.
//
// NOTE(review): many lines are missing from this listing, including the
// declarations of the |end| and |url| parameters, the handling of optional
// terms (kOptional), the conditions around several inserts, some trailing
// call arguments, the #else/#endif of the platform block, the switch
// break/default lines and every return statement -- confirm against the
// upstream file.
539 bool TemplateURLRef::ParseParameter(size_t start
,
542 Replacements
* replacements
) const {
543 DCHECK(start
!= std::string::npos
&&
544 end
!= std::string::npos
&& end
> start
);
545 size_t length
= end
- start
- 1;
546 bool optional
= false;
547 // Make a copy of |url| that can be referenced in StringPieces below. |url| is
548 // modified, so that can't be used in StringPiece.
549 const std::string
original_url(*url
);
550 if (original_url
[end
- 1] == kOptional
) {
555 const base::StringPiece
parameter(original_url
.begin() + start
+ 1,
556 original_url
.begin() + start
+ 1 + length
);
557 const base::StringPiece
full_parameter(original_url
.begin() + start
,
558 original_url
.begin() + end
+ 1);
559 // Remove the parameter from the string. For parameters whose replacement is
560 // constant and already known, just replace them directly. For other cases,
561 // like parameters whose values may change over time, use |replacements|.
562 url
->erase(start
, end
- start
+ 1);
563 if (parameter
== kSearchTermsParameter
) {
564 replacements
->push_back(Replacement(SEARCH_TERMS
, start
));
565 } else if (parameter
== "count") {
567 url
->insert(start
, kDefaultCount
);
568 } else if (parameter
== "google:assistedQueryStats") {
569 replacements
->push_back(Replacement(GOOGLE_ASSISTED_QUERY_STATS
, start
));
570 } else if (parameter
== "google:baseURL") {
571 replacements
->push_back(Replacement(GOOGLE_BASE_URL
, start
));
572 } else if (parameter
== "google:baseSuggestURL") {
573 replacements
->push_back(Replacement(GOOGLE_BASE_SUGGEST_URL
, start
));
574 } else if (parameter
== "google:bookmarkBarPinned") {
575 replacements
->push_back(Replacement(GOOGLE_BOOKMARK_BAR_PINNED
, start
));
576 } else if (parameter
== "google:currentPageUrl") {
577 replacements
->push_back(Replacement(GOOGLE_CURRENT_PAGE_URL
, start
));
578 } else if (parameter
== "google:cursorPosition") {
579 replacements
->push_back(Replacement(GOOGLE_CURSOR_POSITION
, start
));
580 } else if (parameter
== "google:forceInstantResults") {
581 replacements
->push_back(Replacement(GOOGLE_FORCE_INSTANT_RESULTS
, start
));
582 } else if (parameter
== "google:imageOriginalHeight") {
583 replacements
->push_back(
584 Replacement(TemplateURLRef::GOOGLE_IMAGE_ORIGINAL_HEIGHT
, start
));
585 } else if (parameter
== "google:imageOriginalWidth") {
586 replacements
->push_back(
587 Replacement(TemplateURLRef::GOOGLE_IMAGE_ORIGINAL_WIDTH
, start
));
588 } else if (parameter
== "google:imageSearchSource") {
589 replacements
->push_back(
590 Replacement(TemplateURLRef::GOOGLE_IMAGE_SEARCH_SOURCE
, start
));
591 } else if (parameter
== "google:imageThumbnail") {
592 replacements
->push_back(
593 Replacement(TemplateURLRef::GOOGLE_IMAGE_THUMBNAIL
, start
));
594 } else if (parameter
== "google:imageURL") {
595 replacements
->push_back(Replacement(TemplateURLRef::GOOGLE_IMAGE_URL
,
597 } else if (parameter
== "google:inputType") {
598 replacements
->push_back(Replacement(TemplateURLRef::GOOGLE_INPUT_TYPE
,
600 } else if (parameter
== "google:instantExtendedEnabledParameter") {
601 replacements
->push_back(Replacement(GOOGLE_INSTANT_EXTENDED_ENABLED
,
603 } else if (parameter
== "google:instantExtendedEnabledKey") {
604 url
->insert(start
, google_util::kInstantExtendedAPIParam
);
605 } else if (parameter
== "google:ntpIsThemedParameter") {
606 replacements
->push_back(Replacement(GOOGLE_NTP_IS_THEMED
, start
));
607 } else if (parameter
== "google:omniboxStartMarginParameter") {
608 replacements
->push_back(Replacement(GOOGLE_OMNIBOX_START_MARGIN
, start
));
609 } else if (parameter
== "google:contextualSearchVersion") {
610 replacements
->push_back(
611 Replacement(GOOGLE_CONTEXTUAL_SEARCH_VERSION
, start
));
612 } else if (parameter
== "google:contextualSearchContextData") {
613 replacements
->push_back(
614 Replacement(GOOGLE_CONTEXTUAL_SEARCH_CONTEXT_DATA
, start
));
615 } else if (parameter
== "google:originalQueryForSuggestion") {
616 replacements
->push_back(Replacement(GOOGLE_ORIGINAL_QUERY_FOR_SUGGESTION
,
618 } else if (parameter
== "google:pageClassification") {
619 replacements
->push_back(Replacement(GOOGLE_PAGE_CLASSIFICATION
, start
));
620 } else if (parameter
== "google:prefetchQuery") {
621 replacements
->push_back(Replacement(GOOGLE_PREFETCH_QUERY
, start
));
622 } else if (parameter
== "google:RLZ") {
623 replacements
->push_back(Replacement(GOOGLE_RLZ
, start
));
624 } else if (parameter
== "google:searchClient") {
625 replacements
->push_back(Replacement(GOOGLE_SEARCH_CLIENT
, start
));
626 } else if (parameter
== "google:searchFieldtrialParameter") {
627 replacements
->push_back(Replacement(GOOGLE_SEARCH_FIELDTRIAL_GROUP
, start
));
628 } else if (parameter
== "google:searchVersion") {
629 replacements
->push_back(Replacement(GOOGLE_SEARCH_VERSION
, start
));
630 } else if (parameter
== "google:sessionToken") {
631 replacements
->push_back(Replacement(GOOGLE_SESSION_TOKEN
, start
));
632 } else if (parameter
== "google:sourceId") {
633 #if defined(OS_ANDROID) || defined(OS_IOS)
634 url
->insert(start
, "sourceid=chrome-mobile&");
636 url
->insert(start
, "sourceid=chrome&");
638 } else if (parameter
== "google:suggestAPIKeyParameter") {
640 net::EscapeQueryParamValue(google_apis::GetAPIKey(), false));
641 } else if (parameter
== "google:suggestClient") {
642 replacements
->push_back(Replacement(GOOGLE_SUGGEST_CLIENT
, start
));
643 } else if (parameter
== "google:suggestRid") {
644 replacements
->push_back(Replacement(GOOGLE_SUGGEST_REQUEST_ID
, start
));
645 } else if (parameter
== kGoogleUnescapedSearchTermsParameter
) {
646 replacements
->push_back(Replacement(GOOGLE_UNESCAPED_SEARCH_TERMS
, start
));
647 } else if (parameter
== "yandex:searchPath") {
648 switch (ui::GetDeviceFormFactor()) {
649 case ui::DEVICE_FORM_FACTOR_DESKTOP
:
650 url
->insert(start
, "yandsearch");
652 case ui::DEVICE_FORM_FACTOR_PHONE
:
653 url
->insert(start
, "touchsearch");
655 case ui::DEVICE_FORM_FACTOR_TABLET
:
656 url
->insert(start
, "padsearch");
659 } else if (parameter
== "inputEncoding") {
660 replacements
->push_back(Replacement(ENCODING
, start
));
661 } else if (parameter
== "language") {
662 replacements
->push_back(Replacement(LANGUAGE
, start
));
663 } else if (parameter
== "outputEncoding") {
665 url
->insert(start
, kOutputEncodingType
);
666 } else if ((parameter
== "startIndex") || (parameter
== "startPage")) {
667 // We don't support these.
669 url
->insert(start
, "1");
670 } else if (!prepopulated_
) {
671 // If it's a prepopulated URL, we know that it's safe to remove unknown
672 // parameters, so just ignore this and return true below. Otherwise it could
673 // be some garbage but can also be a javascript block. Put it back.
674 url
->insert(start
, full_parameter
.data(), full_parameter
.size());
// Parses the template |url| and returns the URL with its "{...}" terms
// processed by ParseParameter(), filling |replacements| and |post_params|
// along the way.
//
// Phase 1 scans for kStartParameter/kEndParameter pairs. Only leaf pairs (no
// other opening brace before the closing one) are passed to ParseParameter().
// An opening brace with no closing brace makes the function return an empty
// string.
//
// Phase 2 splits GetPostParamsString() on ',' into "name=value" parts. A part
// that does not have exactly one '=' or has an empty name makes the function
// return an empty string. A value that is itself a template term is parsed
// with ParseParameter(); if that added a replacement, the replacement is
// marked as a POST parameter and pointed at the newly appended entry.
//
// NOTE(review): several lines are missing from this listing, including the
// final |valid| out-parameter (passed by ParseIfNecessary()), the updates of
// |last| after a failed parse, and the closing statements and final return --
// confirm against the upstream file.
680 std::string
TemplateURLRef::ParseURL(const std::string
& url
,
681 Replacements
* replacements
,
682 PostParams
* post_params
,
685 std::string parsed_url
= url
;
686 for (size_t last
= 0; last
!= std::string::npos
; ) {
687 last
= parsed_url
.find(kStartParameter
, last
);
688 if (last
!= std::string::npos
) {
689 size_t template_end
= parsed_url
.find(kEndParameter
, last
);
690 if (template_end
!= std::string::npos
) {
691 // Since we allow Javascript in the URL, {} pairs could be nested. Match
692 // only leaf pairs with supported parameters.
693 size_t next_template_start
= parsed_url
.find(kStartParameter
, last
+ 1);
694 if (next_template_start
== std::string::npos
||
695 next_template_start
> template_end
) {
696 // If successful, ParseParameter erases from the string as such no
697 // need to update |last|. If failed, move |last| to the end of pair.
698 if (!ParseParameter(last
, template_end
, &parsed_url
, replacements
)) {
699 // |template_end| + 1 may be beyond the end of the string.
703 last
= next_template_start
;
706 // Open brace without a closing brace, return.
707 return std::string();
712 // Handles the post parameters.
713 const std::string
& post_params_string
= GetPostParamsString();
714 if (!post_params_string
.empty()) {
715 for (const base::StringPiece
& cur
: base::SplitStringPiece(
716 post_params_string
, ",",
717 base::TRIM_WHITESPACE
, base::SPLIT_WANT_ALL
)) {
718 // The '=' delimiter is required and the name must be not empty.
719 std::vector
<std::string
> parts
= base::SplitString(
720 cur
, "=", base::TRIM_WHITESPACE
, base::SPLIT_WANT_ALL
);
721 if ((parts
.size() != 2U) || parts
[0].empty())
722 return std::string();
724 std::string
& value
= parts
[1];
// Remember the size so a replacement added by ParseParameter() can be detected.
725 size_t replacements_size
= replacements
->size();
726 if (IsTemplateParameterString(value
))
727 ParseParameter(0, value
.length() - 1, &value
, replacements
);
728 PostParam param
= { parts
[0], value
};
729 post_params
->push_back(param
);
730 // If there was a replacement added, points its index to last added
732 if (replacements
->size() > replacements_size
) {
733 DCHECK_EQ(replacements_size
+ 1, replacements
->size());
734 Replacement
* r
= &replacements
->back();
735 r
->is_post_param
= true;
736 r
->index
= post_params
->size() - 1;
739 DCHECK(!post_params
->empty());
// Re-parses the template URL and refreshes the cached state: invalidates the
// cached values, stores the result of ParseURL(GetURL(), ...) in parsed_url_,
// and then inspects replacements_ for search-term entries (SEARCH_TERMS or
// GOOGLE_UNESCAPED_SEARCH_TERMS). supports_replacements_ becomes true once
// such an entry is seen. ParseHostAndSearchTermKey() runs only when
// |has_only_one_search_term| is still true after the loop.
// NOTE(review): several lines are missing from this listing, including the
// guard that makes parsing conditional (presumably on parsed_), the loop's
// break, and any checks on valid_ -- confirm against the upstream file.
746 void TemplateURLRef::ParseIfNecessary(
747 const SearchTermsData
& search_terms_data
) const {
749 InvalidateCachedValues();
751 parsed_url_
= ParseURL(GetURL(), &replacements_
, &post_params_
, &valid_
);
752 supports_replacements_
= false;
754 bool has_only_one_search_term
= false;
755 for (Replacements::const_iterator i
= replacements_
.begin();
756 i
!= replacements_
.end(); ++i
) {
757 if ((i
->type
== SEARCH_TERMS
) ||
758 (i
->type
== GOOGLE_UNESCAPED_SEARCH_TERMS
)) {
759 if (has_only_one_search_term
) {
760 has_only_one_search_term
= false;
763 has_only_one_search_term
= true;
764 supports_replacements_
= true;
767 // Only parse the host/key if there is one search term. Technically there
768 // could be more than one term, but it's uncommon; so we punt.
769 if (has_only_one_search_term
)
770 ParseHostAndSearchTermKey(search_terms_data
);
// Works out where the search terms live in the template URL (query, ref or
// path) and caches the result in search_term_key_,
// search_term_key_location_ and search_term_position_in_path_.
//
// "{google:baseURL}" and "{google:baseSuggestURL}" are substituted with the
// values from |search_terms_data| first so that the string can be parsed as a
// GURL. The terms are then looked for in the query and ref (via
// FindSearchTermsKey()) and in the path (via FindSearchTermsInPath()). Only
// the case where exactly one of the three locations matches is handled;
// otherwise the function returns with the cached values left cleared.
//
// For a path match, the escaped "{searchTerms}" text is erased from path_, so
// path_ holds only the surrounding characters.
//
// NOTE(review): several lines are missing from this listing (the embedded
// numbering skips them), including the branch conditions that select between
// the query/ref/path assignments below and whatever assigns path_ before the
// erase -- confirm against the upstream file.
775 void TemplateURLRef::ParseHostAndSearchTermKey(
776 const SearchTermsData
& search_terms_data
) const {
777 std::string
url_string(GetURL());
778 base::ReplaceSubstringsAfterOffset(
779 &url_string
, 0, "{google:baseURL}",
780 search_terms_data
.GoogleBaseURLValue());
781 base::ReplaceSubstringsAfterOffset(
782 &url_string
, 0, "{google:baseSuggestURL}",
783 search_terms_data
.GoogleBaseSuggestURLValue());
785 search_term_key_
.clear();
786 search_term_position_in_path_
= std::string::npos
;
789 search_term_key_location_
= url::Parsed::QUERY
;
791 GURL
url(url_string
);
795 std::string query_key
= FindSearchTermsKey(url
.query());
796 std::string ref_key
= FindSearchTermsKey(url
.ref());
797 url::Component parameter_position
;
798 const bool in_query
= !query_key
.empty();
799 const bool in_ref
= !ref_key
.empty();
800 const bool in_path
= FindSearchTermsInPath(url
.path(), &parameter_position
);
// True when zero locations or more than one location matched.
801 if (in_query
? (in_ref
|| in_path
) : (in_ref
== in_path
))
802 return; // No key or multiple keys found. We only handle having one key.
807 search_term_key_
= query_key
;
808 search_term_key_location_
= url::Parsed::QUERY
;
810 search_term_key_
= ref_key
;
811 search_term_key_location_
= url::Parsed::REF
;
814 DCHECK_GE(parameter_position
.begin
, 1); // Path must start with '/'.
815 search_term_key_location_
= url::Parsed::PATH
;
816 search_term_position_in_path_
= parameter_position
.begin
;
817 // Remove the "{searchTerms}" itself from |path_|.
818 path_
.erase(parameter_position
.begin
, parameter_position
.len
);
// Applies one replacement. |replacement.index| is interpreted according to
// |replacement.is_post_param|:
//   - POST parameter: the index selects an entry of post_params_ (it must be
//     in range and that entry must have a name, both DCHECKed) whose value is
//     overwritten with |value|;
//   - otherwise: the index is an offset into |*url| at which either |value|
//     alone (when |name| is empty) or "name=value&" is inserted.
// NOTE(review): the line separating the two branches (presumably `} else {`)
// and the closing braces are missing from this listing.
822 void TemplateURLRef::HandleReplacement(const std::string
& name
,
823 const std::string
& value
,
824 const Replacement
& replacement
,
825 std::string
* url
) const {
826 size_t pos
= replacement
.index
;
827 if (replacement
.is_post_param
) {
828 DCHECK_LT(pos
, post_params_
.size());
829 DCHECK(!post_params_
[pos
].name
.empty());
830 post_params_
[pos
].value
= value
;
832 url
->insert(pos
, name
.empty() ? value
: (name
+ "=" + value
+ "&"));
836 std::string
TemplateURLRef::HandleReplacements(
837 const SearchTermsArgs
& search_terms_args
,
838 const SearchTermsData
& search_terms_data
,
839 PostContent
* post_content
) const {
840 if (replacements_
.empty()) {
841 if (!post_params_
.empty())
842 EncodeFormData(post_params_
, post_content
);
846 // Determine if the search terms are in the query or before. We're escaping
847 // space as '+' in the former case and as '%20' in the latter case.
848 bool is_in_query
= true;
849 for (Replacements::iterator i
= replacements_
.begin();
850 i
!= replacements_
.end(); ++i
) {
851 if (i
->type
== SEARCH_TERMS
) {
852 base::string16::size_type query_start
= parsed_url_
.find('?');
853 is_in_query
= query_start
!= base::string16::npos
&&
854 (static_cast<base::string16::size_type
>(i
->index
) > query_start
);
859 std::string input_encoding
;
860 base::string16 encoded_terms
;
861 base::string16 encoded_original_query
;
862 owner_
->EncodeSearchTerms(search_terms_args
, is_in_query
, &input_encoding
,
863 &encoded_terms
, &encoded_original_query
);
865 std::string url
= parsed_url_
;
867 // replacements_ is ordered in ascending order, as such we need to iterate
869 for (Replacements::reverse_iterator i
= replacements_
.rbegin();
870 i
!= replacements_
.rend(); ++i
) {
873 HandleReplacement(std::string(), input_encoding
, *i
, &url
);
876 case GOOGLE_ASSISTED_QUERY_STATS
:
877 DCHECK(!i
->is_post_param
);
878 if (!search_terms_args
.assisted_query_stats
.empty()) {
879 // Get the base URL without substituting AQS to avoid infinite
880 // recursion. We need the URL to find out if it meets all
881 // AQS requirements (e.g. HTTPS protocol check).
882 // See TemplateURLRef::SearchTermsArgs for more details.
883 SearchTermsArgs
search_terms_args_without_aqs(search_terms_args
);
884 search_terms_args_without_aqs
.assisted_query_stats
.clear();
885 GURL
base_url(ReplaceSearchTerms(
886 search_terms_args_without_aqs
, search_terms_data
, NULL
));
887 if (base_url
.SchemeIsCryptographic()) {
889 "aqs", search_terms_args
.assisted_query_stats
, *i
, &url
);
894 case GOOGLE_BASE_URL
:
895 DCHECK(!i
->is_post_param
);
897 std::string(), search_terms_data
.GoogleBaseURLValue(), *i
, &url
);
900 case GOOGLE_BASE_SUGGEST_URL
:
901 DCHECK(!i
->is_post_param
);
903 std::string(), search_terms_data
.GoogleBaseSuggestURLValue(), *i
,
907 case GOOGLE_BOOKMARK_BAR_PINNED
:
908 if (search_terms_data
.IsShowingSearchTermsOnSearchResultsPages()) {
909 // Log whether the bookmark bar is pinned when the user is seeing
910 // InstantExtended on the SRP.
911 DCHECK(!i
->is_post_param
);
913 "bmbp", search_terms_args
.bookmark_bar_pinned
? "1" : "0", *i
,
918 case GOOGLE_CURRENT_PAGE_URL
:
919 DCHECK(!i
->is_post_param
);
920 if (!search_terms_args
.current_page_url
.empty()) {
921 const std::string
& escaped_current_page_url
=
922 net::EscapeQueryParamValue(search_terms_args
.current_page_url
,
924 HandleReplacement("url", escaped_current_page_url
, *i
, &url
);
928 case GOOGLE_CURSOR_POSITION
:
929 DCHECK(!i
->is_post_param
);
930 if (search_terms_args
.cursor_position
!= base::string16::npos
)
933 base::StringPrintf("%" PRIuS
, search_terms_args
.cursor_position
),
938 case GOOGLE_FORCE_INSTANT_RESULTS
:
939 DCHECK(!i
->is_post_param
);
940 HandleReplacement(std::string(),
941 search_terms_data
.ForceInstantResultsParam(
942 search_terms_args
.force_instant_results
),
947 case GOOGLE_INPUT_TYPE
:
948 DCHECK(!i
->is_post_param
);
950 "oit", base::IntToString(search_terms_args
.input_type
), *i
, &url
);
953 case GOOGLE_INSTANT_EXTENDED_ENABLED
:
954 DCHECK(!i
->is_post_param
);
955 HandleReplacement(std::string(),
956 search_terms_data
.InstantExtendedEnabledParam(
962 case GOOGLE_NTP_IS_THEMED
:
963 DCHECK(!i
->is_post_param
);
965 std::string(), search_terms_data
.NTPIsThemedParam(), *i
, &url
);
968 case GOOGLE_OMNIBOX_START_MARGIN
:
969 DCHECK(!i
->is_post_param
);
970 if (search_terms_args
.enable_omnibox_start_margin
) {
971 int omnibox_start_margin
= search_terms_data
.OmniboxStartMargin();
972 if (omnibox_start_margin
>= 0) {
973 HandleReplacement("es_sm", base::IntToString(omnibox_start_margin
),
979 case GOOGLE_CONTEXTUAL_SEARCH_VERSION
:
980 if (search_terms_args
.contextual_search_params
.version
>= 0) {
984 search_terms_args
.contextual_search_params
.version
),
990 case GOOGLE_CONTEXTUAL_SEARCH_CONTEXT_DATA
: {
991 DCHECK(!i
->is_post_param
);
992 std::string context_data
;
994 const SearchTermsArgs::ContextualSearchParams
& params
=
995 search_terms_args
.contextual_search_params
;
997 if (params
.start
!= std::string::npos
) {
998 context_data
.append("ctxs_start=" + base::IntToString(
999 params
.start
) + "&");
1002 if (params
.end
!= std::string::npos
) {
1003 context_data
.append("ctxs_end=" + base::IntToString(
1007 if (!params
.selection
.empty())
1008 context_data
.append("q=" + params
.selection
+ "&");
1010 if (!params
.content
.empty())
1011 context_data
.append("ctxs_content=" + params
.content
+ "&");
1013 if (!params
.base_page_url
.empty())
1014 context_data
.append("ctxsl_url=" + params
.base_page_url
+ "&");
1016 if (!params
.encoding
.empty()) {
1017 context_data
.append("ctxs_encoding=" + params
.encoding
+ "&");
1020 context_data
.append(
1021 params
.resolve
? "ctxsl_resolve=1" : "ctxsl_resolve=0");
1023 HandleReplacement(std::string(), context_data
, *i
, &url
);
1027 case GOOGLE_ORIGINAL_QUERY_FOR_SUGGESTION
:
1028 DCHECK(!i
->is_post_param
);
1029 if (search_terms_args
.accepted_suggestion
>= 0 ||
1030 !search_terms_args
.assisted_query_stats
.empty()) {
1032 "oq", base::UTF16ToUTF8(encoded_original_query
), *i
, &url
);
1036 case GOOGLE_PAGE_CLASSIFICATION
:
1037 if (search_terms_args
.page_classification
!=
1038 metrics::OmniboxEventProto::INVALID_SPEC
) {
1040 "pgcl", base::IntToString(search_terms_args
.page_classification
),
1045 case GOOGLE_PREFETCH_QUERY
: {
1046 const std::string
& query
= search_terms_args
.prefetch_query
;
1047 const std::string
& type
= search_terms_args
.prefetch_query_type
;
1048 if (!query
.empty() && !type
.empty()) {
1050 std::string(), "pfq=" + query
+ "&qha=" + type
+ "&", *i
, &url
);
1056 DCHECK(!i
->is_post_param
);
1057 // On platforms that don't have RLZ, we still want this branch
1058 // to happen so that we replace the RLZ template with the
1059 // empty string. (If we don't handle this case, we hit a
1060 // NOTREACHED below.)
1061 base::string16 rlz_string
= search_terms_data
.GetRlzParameterValue(
1062 search_terms_args
.from_app_list
);
1063 if (!rlz_string
.empty()) {
1064 HandleReplacement("rlz", base::UTF16ToUTF8(rlz_string
), *i
, &url
);
1069 case GOOGLE_SEARCH_CLIENT
: {
1070 DCHECK(!i
->is_post_param
);
1071 std::string client
= search_terms_data
.GetSearchClient();
1072 if (!client
.empty())
1073 HandleReplacement("client", client
, *i
, &url
);
1077 case GOOGLE_SEARCH_FIELDTRIAL_GROUP
:
1078 // We are not currently running any fieldtrials that modulate the search
1079 // url. If we do, then we'd have some conditional insert such as:
1080 // url.insert(i->index, used_www ? "gcx=w&" : "gcx=c&");
1083 case GOOGLE_SEARCH_VERSION
:
1084 HandleReplacement("gs_rn", "42", *i
, &url
);
1087 case GOOGLE_SESSION_TOKEN
: {
1088 std::string token
= search_terms_args
.session_token
;
1090 HandleReplacement("psi", token
, *i
, &url
);
1094 case GOOGLE_SUGGEST_CLIENT
:
1096 std::string(), search_terms_data
.GetSuggestClient(), *i
, &url
);
1099 case GOOGLE_SUGGEST_REQUEST_ID
:
1101 std::string(), search_terms_data
.GetSuggestRequestIdentifier(), *i
,
1105 case GOOGLE_UNESCAPED_SEARCH_TERMS
: {
1106 std::string unescaped_terms
;
1107 base::UTF16ToCodepage(search_terms_args
.search_terms
,
1108 input_encoding
.c_str(),
1109 base::OnStringConversionError::SKIP
,
1111 HandleReplacement(std::string(), unescaped_terms
, *i
, &url
);
1117 std::string(), search_terms_data
.GetApplicationLocale(), *i
, &url
);
1122 std::string(), base::UTF16ToUTF8(encoded_terms
), *i
, &url
);
1125 case GOOGLE_IMAGE_THUMBNAIL
:
1127 std::string(), search_terms_args
.image_thumbnail_content
, *i
, &url
);
1128 post_params_
[i
->index
].content_type
= "image/jpeg";
1131 case GOOGLE_IMAGE_URL
:
1132 if (search_terms_args
.image_url
.is_valid()) {
1134 std::string(), search_terms_args
.image_url
.spec(), *i
, &url
);
1138 case GOOGLE_IMAGE_ORIGINAL_WIDTH
:
1139 if (!search_terms_args
.image_original_size
.IsEmpty()) {
1142 base::IntToString(search_terms_args
.image_original_size
.width()),
1147 case GOOGLE_IMAGE_ORIGINAL_HEIGHT
:
1148 if (!search_terms_args
.image_original_size
.IsEmpty()) {
1151 base::IntToString(search_terms_args
.image_original_size
.height()),
1156 case GOOGLE_IMAGE_SEARCH_SOURCE
:
1158 std::string(), search_terms_data
.GoogleImageSearchSource(), *i
,
1168 if (!post_params_
.empty())
1169 EncodeFormData(post_params_
, post_content
);
1175 // TemplateURL ----------------------------------------------------------------
// Constructs an AssociatedExtensionInfo, storing |extension_id| and starting
// with |wants_to_be_default_engine| set to false.
// NOTE(review): the declaration of the |type| argument (and any initializer
// for a |type| member) is not visible in this view - confirm against the full
// file.
1177 TemplateURL::AssociatedExtensionInfo::AssociatedExtensionInfo(
1179 const std::string
& extension_id
)
1181 extension_id(extension_id
),
1182 wants_to_be_default_engine(false) {
// Debug-only check that |type| is not NORMAL.
1183 DCHECK_NE(NORMAL
, type
);
// Destructor. No cleanup statements are visible for it in this view.
1186 TemplateURL::AssociatedExtensionInfo::~AssociatedExtensionInfo() {
// Builds a TemplateURL from |data|. One TemplateURLRef is created per URL
// kind (search, suggest, instant, image, new tab, contextual search), each
// pointing back at this object.
// NOTE(review): the initializer that copies |data| into |data_| is not visible
// in this view - confirm against the full file.
1189 TemplateURL::TemplateURL(const TemplateURLData
& data
)
1191 url_ref_(this, TemplateURLRef::SEARCH
),
1192 suggestions_url_ref_(this,
1193 TemplateURLRef::SUGGEST
),
1194 instant_url_ref_(this,
1195 TemplateURLRef::INSTANT
),
1196 image_url_ref_(this, TemplateURLRef::IMAGE
),
1197 new_tab_url_ref_(this, TemplateURLRef::NEW_TAB
),
1198 contextual_search_url_ref_(this, TemplateURLRef::CONTEXTUAL_SEARCH
) {
// Route the id through SetPrepopulateId() so the refs' prepopulated flags are
// updated along with |data_|.
1199 SetPrepopulateId(data_
.prepopulate_id
);
// A replacement key stored as the literal placeholder string is swapped for
// google_util::kInstantExtendedAPIParam.
1201 if (data_
.search_terms_replacement_key
==
1202 "{google:instantExtendedEnabledKey}") {
1203 data_
.search_terms_replacement_key
= google_util::kInstantExtendedAPIParam
;
// Destructor. No cleanup statements are visible for it in this view.
1207 TemplateURL::~TemplateURL() {
1211 base::string16
TemplateURL::GenerateKeyword(
1213 const std::string
& accept_languages
) {
1214 DCHECK(url
.is_valid());
1215 // Strip "www." off the front of the keyword; otherwise the keyword won't work
1216 // properly. See http://code.google.com/p/chromium/issues/detail?id=6984 .
1217 // |url|'s hostname may be IDN-encoded. Before generating |keyword| from it,
1218 // convert to Unicode using the user's accept-languages, so it won't look like
1219 // a confusing punycode string.
1220 base::string16 keyword
=
1221 net::StripWWW(url_formatter::IDNToUnicode(url
.host(), accept_languages
));
1222 // Special case: if the host was exactly "www." (not sure this can happen but
1223 // perhaps with some weird intranet and custom DNS server?), ensure we at
1224 // least don't return the empty string.
1225 return keyword
.empty() ? base::ASCIIToUTF16("www") : keyword
;
// Returns a copy of |url| whose path is replaced by "/favicon.ico" and whose
// username and password are cleared. |url| must be valid (DCHECKed).
// NOTE(review): the embedded source numbering skips 1239-1240, so further
// component-clearing calls may be missing from this view - confirm against the
// full file.
1229 GURL
TemplateURL::GenerateFaviconURL(const GURL
& url
) {
1230 DCHECK(url
.is_valid());
1231 GURL::Replacements rep
;
1233 const char favicon_path
[] = "/favicon.ico";
// arraysize() counts the terminating NUL, hence the -1.
1234 int favicon_path_len
= arraysize(favicon_path
) - 1;
1236 rep
.SetPath(favicon_path
, url::Component(0, favicon_path_len
));
1237 rep
.ClearUsername();
1238 rep
.ClearPassword();
1241 return url
.ReplaceComponents(rep
);
1245 bool TemplateURL::MatchesData(const TemplateURL
* t_url
,
1246 const TemplateURLData
* data
,
1247 const SearchTermsData
& search_terms_data
) {
1248 if (!t_url
|| !data
)
1249 return !t_url
&& !data
;
1251 return (t_url
->short_name() == data
->short_name()) &&
1252 t_url
->HasSameKeywordAs(*data
, search_terms_data
) &&
1253 (t_url
->url() == data
->url()) &&
1254 (t_url
->suggestions_url() == data
->suggestions_url
) &&
1255 (t_url
->instant_url() == data
->instant_url
) &&
1256 (t_url
->image_url() == data
->image_url
) &&
1257 (t_url
->new_tab_url() == data
->new_tab_url
) &&
1258 (t_url
->search_url_post_params() == data
->search_url_post_params
) &&
1259 (t_url
->suggestions_url_post_params() ==
1260 data
->suggestions_url_post_params
) &&
1261 (t_url
->instant_url_post_params() == data
->instant_url_post_params
) &&
1262 (t_url
->image_url_post_params() == data
->image_url_post_params
) &&
1263 (t_url
->favicon_url() == data
->favicon_url
) &&
1264 (t_url
->safe_for_autoreplace() == data
->safe_for_autoreplace
) &&
1265 (t_url
->show_in_default_list() == data
->show_in_default_list
) &&
1266 (t_url
->input_encodings() == data
->input_encodings
) &&
1267 (t_url
->alternate_urls() == data
->alternate_urls
) &&
1268 (t_url
->search_terms_replacement_key() ==
1269 data
->search_terms_replacement_key
);
1272 base::string16
TemplateURL::AdjustedShortNameForLocaleDirection() const {
1273 base::string16 bidi_safe_short_name
= data_
.short_name();
1274 base::i18n::AdjustStringForLocaleDirection(&bidi_safe_short_name
);
1275 return bidi_safe_short_name
;
1278 bool TemplateURL::ShowInDefaultList(
1279 const SearchTermsData
& search_terms_data
) const {
1280 return data_
.show_in_default_list
&&
1281 url_ref_
.SupportsReplacement(search_terms_data
);
1284 bool TemplateURL::SupportsReplacement(
1285 const SearchTermsData
& search_terms_data
) const {
1286 return url_ref_
.SupportsReplacement(search_terms_data
);
1289 bool TemplateURL::HasGoogleBaseURLs(
1290 const SearchTermsData
& search_terms_data
) const {
1291 return url_ref_
.HasGoogleBaseURLs(search_terms_data
) ||
1292 suggestions_url_ref_
.HasGoogleBaseURLs(search_terms_data
) ||
1293 instant_url_ref_
.HasGoogleBaseURLs(search_terms_data
) ||
1294 image_url_ref_
.HasGoogleBaseURLs(search_terms_data
) ||
1295 new_tab_url_ref_
.HasGoogleBaseURLs(search_terms_data
);
1298 bool TemplateURL::IsGoogleSearchURLWithReplaceableKeyword(
1299 const SearchTermsData
& search_terms_data
) const {
1300 return (GetType() == NORMAL
) &&
1301 url_ref_
.HasGoogleBaseURLs(search_terms_data
) &&
1302 google_util::IsGoogleHostname(base::UTF16ToUTF8(data_
.keyword()),
1303 google_util::DISALLOW_SUBDOMAIN
);
1306 bool TemplateURL::HasSameKeywordAs(
1307 const TemplateURLData
& other
,
1308 const SearchTermsData
& search_terms_data
) const {
1309 return (data_
.keyword() == other
.keyword()) ||
1310 (IsGoogleSearchURLWithReplaceableKeyword(search_terms_data
) &&
1311 TemplateURL(other
).IsGoogleSearchURLWithReplaceableKeyword(
1312 search_terms_data
));
1315 TemplateURL::Type
TemplateURL::GetType() const {
1316 return extension_info_
? extension_info_
->type
: NORMAL
;
1319 std::string
TemplateURL::GetExtensionId() const {
1320 DCHECK(extension_info_
);
1321 return extension_info_
->extension_id
;
1324 size_t TemplateURL::URLCount() const {
1325 // Add 1 for the regular search URL.
1326 return data_
.alternate_urls
.size() + 1;
1329 const std::string
& TemplateURL::GetURL(size_t index
) const {
1330 DCHECK_LT(index
, URLCount());
1332 return (index
< data_
.alternate_urls
.size()) ?
1333 data_
.alternate_urls
[index
] : url();
1336 bool TemplateURL::ExtractSearchTermsFromURL(
1338 const SearchTermsData
& search_terms_data
,
1339 base::string16
* search_terms
) const {
1340 return FindSearchTermsInURL(url
, search_terms_data
, search_terms
, NULL
, NULL
);
1343 bool TemplateURL::IsSearchURL(const GURL
& url
,
1344 const SearchTermsData
& search_terms_data
) const {
1345 base::string16 search_terms
;
1346 return ExtractSearchTermsFromURL(url
, search_terms_data
, &search_terms
) &&
1347 !search_terms
.empty();
1350 bool TemplateURL::HasSearchTermsReplacementKey(const GURL
& url
) const {
1351 // Look for the key both in the query and the ref.
1352 std::string params
[] = {url
.query(), url
.ref()};
1354 for (int i
= 0; i
< 2; ++i
) {
1355 url::Component query
, key
, value
;
1356 query
.len
= static_cast<int>(params
[i
].size());
1357 while (url::ExtractQueryKeyValue(params
[i
].c_str(), &query
, &key
, &value
)) {
1358 if (key
.is_nonempty() &&
1359 params
[i
].substr(key
.begin
, key
.len
) ==
1360 search_terms_replacement_key()) {
1368 bool TemplateURL::ReplaceSearchTermsInURL(
1370 const TemplateURLRef::SearchTermsArgs
& search_terms_args
,
1371 const SearchTermsData
& search_terms_data
,
1373 // TODO(beaudoin): Use AQS from |search_terms_args| too.
1374 url::Parsed::ComponentType search_term_component
;
1375 url::Component search_terms_position
;
1376 base::string16 search_terms
;
1377 if (!FindSearchTermsInURL(url
, search_terms_data
, &search_terms
,
1378 &search_term_component
, &search_terms_position
)) {
1381 DCHECK(search_terms_position
.is_nonempty());
1383 // Query and ref are encoded in the same way.
1384 const bool is_in_query
= (search_term_component
!= url::Parsed::PATH
);
1386 std::string input_encoding
;
1387 base::string16 encoded_terms
;
1388 base::string16 encoded_original_query
;
1389 EncodeSearchTerms(search_terms_args
, is_in_query
, &input_encoding
,
1390 &encoded_terms
, &encoded_original_query
);
1392 std::string old_params
;
1393 if (search_term_component
== url::Parsed::QUERY
) {
1394 old_params
= url
.query();
1395 } else if (search_term_component
== url::Parsed::REF
) {
1396 old_params
= url
.ref();
1398 DCHECK_EQ(search_term_component
, url::Parsed::PATH
);
1399 old_params
= url
.path();
1402 std::string
new_params(old_params
, 0, search_terms_position
.begin
);
1403 new_params
+= base::UTF16ToUTF8(encoded_terms
);
1404 new_params
+= old_params
.substr(search_terms_position
.end());
1405 GURL::Replacements replacements
;
1407 if (search_term_component
== url::Parsed::QUERY
) {
1408 replacements
.SetQueryStr(new_params
);
1409 } else if (search_term_component
== url::Parsed::REF
) {
1410 replacements
.SetRefStr(new_params
);
1412 DCHECK_EQ(search_term_component
, url::Parsed::PATH
);
1413 replacements
.SetPathStr(new_params
);
1416 *result
= url
.ReplaceComponents(replacements
);
// Encodes the search terms and original query from |search_terms_args|.
// Each of this TemplateURL's input encodings is tried in order, with "UTF-8"
// appended as a final candidate when it is not already listed. The encoding
// for which TryEncoding() first succeeds is stored in |*input_encoding|;
// |encoded_terms| and |encoded_original_query| are passed straight through to
// TryEncoding().
// NOTE(review): the declaration of |is_in_query| and the statements that
// follow the assignment to |*input_encoding| are not visible in this view -
// confirm against the full file.
1420 void TemplateURL::EncodeSearchTerms(
1421 const TemplateURLRef::SearchTermsArgs
& search_terms_args
,
1423 std::string
* input_encoding
,
1424 base::string16
* encoded_terms
,
1425 base::string16
* encoded_original_query
) const {
// Work on a copy so that appending "UTF-8" does not modify the stored list.
1427 std::vector
<std::string
> encodings(input_encodings());
1428 if (std::find(encodings
.begin(), encodings
.end(), "UTF-8") == encodings
.end())
1429 encodings
.push_back("UTF-8");
1430 for (std::vector
<std::string
>::const_iterator
i(encodings
.begin());
1431 i
!= encodings
.end(); ++i
) {
1432 if (TryEncoding(search_terms_args
.search_terms
,
1433 search_terms_args
.original_query
, i
->c_str(),
1434 is_in_query
, encoded_terms
, encoded_original_query
)) {
// Report which encoding succeeded.
1435 *input_encoding
= *i
;
// Produces a GURL for this engine's search URL by substituting a fixed
// placeholder string for the search terms.
// NOTE(review): the statements executed when the URL ref is invalid, or does
// not support replacement, are not visible in this view - confirm against the
// full file.
1442 GURL
TemplateURL::GenerateSearchURL(
1443 const SearchTermsData
& search_terms_data
) const {
1444 if (!url_ref_
.IsValid(search_terms_data
))
1447 if (!url_ref_
.SupportsReplacement(search_terms_data
))
1450 // Use something obscure for the search terms argument so that in the rare
1451 // case the term replaces the URL it's unlikely another keyword would have the
1453 // TODO(jnd): Add additional parameters to get post data when the search URL
1454 // has post parameters.
// NULL is passed as the final ReplaceSearchTerms() argument; per the TODO
// above, post data is not requested here.
1455 return GURL(url_ref_
.ReplaceSearchTerms(
1456 TemplateURLRef::SearchTermsArgs(
1457 base::ASCIIToUTF16("blah.blah.blah.blah.blah")),
1458 search_terms_data
, NULL
));
1461 void TemplateURL::CopyFrom(const TemplateURL
& other
) {
1465 data_
= other
.data_
;
1466 url_ref_
.InvalidateCachedValues();
1467 suggestions_url_ref_
.InvalidateCachedValues();
1468 instant_url_ref_
.InvalidateCachedValues();
1469 SetPrepopulateId(other
.data_
.prepopulate_id
);
// Changes the search URL to |url| and invalidates the search URL ref's cached
// values.
// NOTE(review): the statement that stores |url| (original line 1473) is not
// visible in this view - confirm against the full file.
1472 void TemplateURL::SetURL(const std::string
& url
) {
1474 url_ref_
.InvalidateCachedValues();
1477 void TemplateURL::SetPrepopulateId(int id
) {
1478 data_
.prepopulate_id
= id
;
1479 const bool prepopulated
= id
> 0;
1480 url_ref_
.prepopulated_
= prepopulated
;
1481 suggestions_url_ref_
.prepopulated_
= prepopulated
;
1482 instant_url_ref_
.prepopulated_
= prepopulated
;
// Regenerates the keyword from the generated search URL when this is a Google
// search URL with a replaceable keyword, or when |force| is set.
// NOTE(review): the declaration of |force| and the statement that consumes the
// GenerateKeyword() result (original lines 1487 and 1491-1492) are not visible
// in this view - confirm against the full file.
1485 void TemplateURL::ResetKeywordIfNecessary(
1486 const SearchTermsData
& search_terms_data
,
1488 if (IsGoogleSearchURLWithReplaceableKeyword(search_terms_data
) || force
) {
// Debug-only check that this is not an omnibox API extension engine.
1489 DCHECK(GetType() != OMNIBOX_API_EXTENSION
);
1490 GURL
url(GenerateSearchURL(search_terms_data
));
1493 GenerateKeyword(url
, search_terms_data
.GetAcceptLanguages()));
1497 bool TemplateURL::FindSearchTermsInURL(
1499 const SearchTermsData
& search_terms_data
,
1500 base::string16
* search_terms
,
1501 url::Parsed::ComponentType
* search_term_component
,
1502 url::Component
* search_terms_position
) const {
1503 DCHECK(search_terms
);
1504 search_terms
->clear();
1506 // Try to match with every pattern.
1507 for (size_t i
= 0; i
< URLCount(); ++i
) {
1508 TemplateURLRef
ref(this, i
);
1509 if (ref
.ExtractSearchTermsFromURL(url
, search_terms
, search_terms_data
,
1510 search_term_component
, search_terms_position
)) {
1511 // If ExtractSearchTermsFromURL() returns true and |search_terms| is empty
1512 // it means the pattern matched but no search terms were present. In this
1513 // case we fail immediately without looking for matches in subsequent
1514 // patterns. This means that given patterns
1515 // [ "http://foo/#q={searchTerms}", "http://foo/?q={searchTerms}" ],
1516 // calling ExtractSearchTermsFromURL() on "http://foo/?q=bar#q=" would
1517 // return false. This is important for at least Google, where such URLs
1519 return !search_terms
->empty();