// Copyright 2014 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#include "components/search_engines/template_url.h"

#include <string>
#include <vector>

#include "base/basictypes.h"
#include "base/command_line.h"
#include "base/format_macros.h"
#include "base/i18n/icu_string_conversions.h"
#include "base/i18n/rtl.h"
#include "base/logging.h"
#include "base/metrics/field_trial.h"
#include "base/rand_util.h"
#include "base/strings/string_number_conversions.h"
#include "base/strings/string_split.h"
#include "base/strings/string_util.h"
#include "base/strings/stringprintf.h"
#include "base/strings/utf_string_conversions.h"
#include "components/google/core/browser/google_util.h"
#include "components/metrics/proto/omnibox_input_type.pb.h"
#include "components/search_engines/search_engines_switches.h"
#include "components/search_engines/search_terms_data.h"
#include "google_apis/google_api_keys.h"
#include "net/base/escape.h"
#include "net/base/mime_util.h"
#include "net/base/net_util.h"

namespace {

// The TemplateURLRef has any number of terms that need to be replaced. Each of
// the terms is enclosed in braces. If the character preceding the final
// brace is a ?, it indicates the term is optional and can be replaced with
// an empty string.
const char kStartParameter = '{';
const char kEndParameter = '}';
const char kOptional = '?';

// Known parameters found in the URL. Constants whose name ends in "Full" hold
// the same parameter name including the enclosing braces, for code that
// searches for or substitutes the literal "{name}" text.
const char kSearchTermsParameter[] = "searchTerms";
const char kSearchTermsParameterFull[] = "{searchTerms}";
const char kCountParameter[] = "count";
const char kStartIndexParameter[] = "startIndex";
const char kStartPageParameter[] = "startPage";
const char kLanguageParameter[] = "language";
const char kInputEncodingParameter[] = "inputEncoding";
const char kOutputEncodingParameter[] = "outputEncoding";

const char kGoogleAssistedQueryStatsParameter[] = "google:assistedQueryStats";

// Host/Domain Google searches are relative to.
const char kGoogleBaseURLParameter[] = "google:baseURL";
const char kGoogleBaseURLParameterFull[] = "{google:baseURL}";

// Like google:baseURL, but for the Search Suggest capability.
const char kGoogleBaseSuggestURLParameter[] = "google:baseSuggestURL";
const char kGoogleBaseSuggestURLParameterFull[] = "{google:baseSuggestURL}";
const char kGoogleBookmarkBarPinnedParameter[] = "google:bookmarkBarPinned";
const char kGoogleContextualSearchContextData[] =
    "google:contextualSearchContextData";
const char kGoogleContextualSearchVersion[] = "google:contextualSearchVersion";
const char kGoogleCurrentPageUrlParameter[] = "google:currentPageUrl";
const char kGoogleCursorPositionParameter[] = "google:cursorPosition";
const char kGoogleForceInstantResultsParameter[] = "google:forceInstantResults";
const char kGoogleImageSearchSource[] = "google:imageSearchSource";
const char kGoogleImageThumbnailParameter[] = "google:imageThumbnail";
const char kGoogleImageOriginalWidth[] = "google:imageOriginalWidth";
const char kGoogleImageOriginalHeight[] = "google:imageOriginalHeight";
const char kGoogleImageURLParameter[] = "google:imageURL";
const char kGoogleInputTypeParameter[] = "google:inputType";
const char kGoogleInstantExtendedEnabledParameter[] =
    "google:instantExtendedEnabledParameter";
const char kGoogleInstantExtendedEnabledKey[] =
    "google:instantExtendedEnabledKey";
const char kGoogleInstantExtendedEnabledKeyFull[] =
    "{google:instantExtendedEnabledKey}";
const char kGoogleNTPIsThemedParameter[] = "google:ntpIsThemedParameter";
const char kGoogleOmniboxStartMarginParameter[] =
    "google:omniboxStartMarginParameter";
const char kGoogleOriginalQueryForSuggestionParameter[] =
    "google:originalQueryForSuggestion";
const char kGooglePageClassificationParameter[] = "google:pageClassification";
const char kGooglePrefetchQuery[] = "google:prefetchQuery";
const char kGoogleRLZParameter[] = "google:RLZ";
const char kGoogleSearchClient[] = "google:searchClient";
const char kGoogleSearchFieldtrialParameter[] =
    "google:searchFieldtrialParameter";
const char kGoogleSearchVersion[] = "google:searchVersion";
const char kGoogleSessionToken[] = "google:sessionToken";
const char kGoogleSourceIdParameter[] = "google:sourceId";
const char kGoogleSuggestAPIKeyParameter[] = "google:suggestAPIKeyParameter";
const char kGoogleSuggestClient[] = "google:suggestClient";
const char kGoogleSuggestRequestId[] = "google:suggestRid";

// Same as kSearchTermsParameter, with no escaping.
const char kGoogleUnescapedSearchTermsParameter[] =
    "google:unescapedSearchTerms";
const char kGoogleUnescapedSearchTermsParameterFull[] =
    "{google:unescapedSearchTerms}";

// Display value for kSearchTermsParameter.
const char kDisplaySearchTerms[] = "%s";

// Display value for kGoogleUnescapedSearchTermsParameter.
const char kDisplayUnescapedSearchTerms[] = "%S";

// Used if the count parameter is not optional. Indicates we want 10 search
// results.
const char kDefaultCount[] = "10";

// Used if the parameter kOutputEncodingParameter is required.
const char kOutputEncodingType[] = "UTF-8";

// Attempts to encode |terms| and |original_query| in |encoding| and escape
// them.
|terms| may be escaped as path or query depending on |is_in_query|; 119 // |original_query| is always escaped as query. Returns whether the encoding 120 // process succeeded. 121 bool TryEncoding(const base::string16& terms, 122 const base::string16& original_query, 123 const char* encoding, 124 bool is_in_query, 125 base::string16* escaped_terms, 126 base::string16* escaped_original_query) { 127 DCHECK(escaped_terms); 128 DCHECK(escaped_original_query); 129 std::string encoded_terms; 130 if (!base::UTF16ToCodepage(terms, encoding, 131 base::OnStringConversionError::SKIP, &encoded_terms)) 132 return false; 133 *escaped_terms = base::UTF8ToUTF16(is_in_query ? 134 net::EscapeQueryParamValue(encoded_terms, true) : 135 net::EscapePath(encoded_terms)); 136 if (original_query.empty()) 137 return true; 138 std::string encoded_original_query; 139 if (!base::UTF16ToCodepage(original_query, encoding, 140 base::OnStringConversionError::SKIP, &encoded_original_query)) 141 return false; 142 *escaped_original_query = base::UTF8ToUTF16( 143 net::EscapeQueryParamValue(encoded_original_query, true)); 144 return true; 145 } 146 147 // Extract query key and host given a list of parameters coming from the URL 148 // query or ref. 
149 std::string FindSearchTermsKey(const std::string& params) { 150 if (params.empty()) 151 return std::string(); 152 url::Component query, key, value; 153 query.len = static_cast<int>(params.size()); 154 while (url::ExtractQueryKeyValue(params.c_str(), &query, &key, &value)) { 155 if (key.is_nonempty() && value.is_nonempty()) { 156 std::string value_string = params.substr(value.begin, value.len); 157 if (value_string.find(kSearchTermsParameterFull, 0) != 158 std::string::npos || 159 value_string.find(kGoogleUnescapedSearchTermsParameterFull, 0) != 160 std::string::npos) { 161 return params.substr(key.begin, key.len); 162 } 163 } 164 } 165 return std::string(); 166 } 167 168 bool IsTemplateParameterString(const std::string& param) { 169 return (param.length() > 2) && (*(param.begin()) == kStartParameter) && 170 (*(param.rbegin()) == kEndParameter); 171 } 172 173 } // namespace 174 175 176 // TemplateURLRef::SearchTermsArgs -------------------------------------------- 177 178 TemplateURLRef::SearchTermsArgs::SearchTermsArgs( 179 const base::string16& search_terms) 180 : search_terms(search_terms), 181 input_type(metrics::OmniboxInputType::INVALID), 182 accepted_suggestion(NO_SUGGESTIONS_AVAILABLE), 183 cursor_position(base::string16::npos), 184 enable_omnibox_start_margin(false), 185 page_classification(metrics::OmniboxEventProto::INVALID_SPEC), 186 bookmark_bar_pinned(false), 187 append_extra_query_params(false), 188 force_instant_results(false), 189 from_app_list(false), 190 contextual_search_params(ContextualSearchParams()) { 191 } 192 193 TemplateURLRef::SearchTermsArgs::~SearchTermsArgs() { 194 } 195 196 TemplateURLRef::SearchTermsArgs::ContextualSearchParams:: 197 ContextualSearchParams() 198 : version(-1), 199 start(base::string16::npos), 200 end(base::string16::npos), 201 resolve(true) { 202 } 203 204 TemplateURLRef::SearchTermsArgs::ContextualSearchParams:: 205 ContextualSearchParams( 206 const int version, 207 const std::string& selection, 208 const 
std::string& base_page_url, 209 const bool resolve) 210 : version(version), 211 start(base::string16::npos), 212 end(base::string16::npos), 213 selection(selection), 214 base_page_url(base_page_url), 215 resolve(resolve) { 216 } 217 218 TemplateURLRef::SearchTermsArgs::ContextualSearchParams:: 219 ContextualSearchParams( 220 const int version, 221 const size_t start, 222 const size_t end, 223 const std::string& selection, 224 const std::string& content, 225 const std::string& base_page_url, 226 const std::string& encoding, 227 const bool resolve) 228 : version(version), 229 start(start), 230 end(end), 231 selection(selection), 232 content(content), 233 base_page_url(base_page_url), 234 encoding(encoding), 235 resolve(resolve) { 236 } 237 238 TemplateURLRef::SearchTermsArgs::ContextualSearchParams:: 239 ~ContextualSearchParams() { 240 } 241 242 // TemplateURLRef ------------------------------------------------------------- 243 244 TemplateURLRef::TemplateURLRef(TemplateURL* owner, Type type) 245 : owner_(owner), 246 type_(type), 247 index_in_owner_(0), 248 parsed_(false), 249 valid_(false), 250 supports_replacements_(false), 251 search_term_key_location_(url::Parsed::QUERY), 252 prepopulated_(false) { 253 DCHECK(owner_); 254 DCHECK_NE(INDEXED, type_); 255 } 256 257 TemplateURLRef::TemplateURLRef(TemplateURL* owner, size_t index_in_owner) 258 : owner_(owner), 259 type_(INDEXED), 260 index_in_owner_(index_in_owner), 261 parsed_(false), 262 valid_(false), 263 supports_replacements_(false), 264 search_term_key_location_(url::Parsed::QUERY), 265 prepopulated_(false) { 266 DCHECK(owner_); 267 DCHECK_LT(index_in_owner_, owner_->URLCount()); 268 } 269 270 TemplateURLRef::~TemplateURLRef() { 271 } 272 273 std::string TemplateURLRef::GetURL() const { 274 switch (type_) { 275 case SEARCH: return owner_->url(); 276 case SUGGEST: return owner_->suggestions_url(); 277 case INSTANT: return owner_->instant_url(); 278 case IMAGE: return owner_->image_url(); 279 case NEW_TAB: return 
owner_->new_tab_url(); 280 case CONTEXTUAL_SEARCH: return owner_->contextual_search_url(); 281 case INDEXED: return owner_->GetURL(index_in_owner_); 282 default: NOTREACHED(); return std::string(); // NOLINT 283 } 284 } 285 286 std::string TemplateURLRef::GetPostParamsString() const { 287 switch (type_) { 288 case INDEXED: 289 case SEARCH: return owner_->search_url_post_params(); 290 case SUGGEST: return owner_->suggestions_url_post_params(); 291 case INSTANT: return owner_->instant_url_post_params(); 292 case NEW_TAB: return std::string(); 293 case CONTEXTUAL_SEARCH: return std::string(); 294 case IMAGE: return owner_->image_url_post_params(); 295 default: NOTREACHED(); return std::string(); // NOLINT 296 } 297 } 298 299 bool TemplateURLRef::UsesPOSTMethod( 300 const SearchTermsData& search_terms_data) const { 301 ParseIfNecessary(search_terms_data); 302 return !post_params_.empty(); 303 } 304 305 bool TemplateURLRef::EncodeFormData(const PostParams& post_params, 306 PostContent* post_content) const { 307 if (post_params.empty()) 308 return true; 309 if (!post_content) 310 return false; 311 312 const char kUploadDataMIMEType[] = "multipart/form-data; boundary="; 313 const char kMultipartBoundary[] = "----+*+----%016" PRIx64 "----+*+----"; 314 // Each name/value pair is stored in a body part which is preceded by a 315 // boundary delimiter line. Uses random number generator here to create 316 // a unique boundary delimiter for form data encoding. 317 std::string boundary = base::StringPrintf(kMultipartBoundary, 318 base::RandUint64()); 319 // Sets the content MIME type. 320 post_content->first = kUploadDataMIMEType; 321 post_content->first += boundary; 322 // Encodes the post parameters. 
323 std::string* post_data = &post_content->second; 324 post_data->clear(); 325 for (PostParams::const_iterator param = post_params.begin(); 326 param != post_params.end(); ++param) { 327 DCHECK(!param->first.empty()); 328 net::AddMultipartValueForUpload(param->first, param->second, boundary, 329 std::string(), post_data); 330 } 331 net::AddMultipartFinalDelimiterForUpload(boundary, post_data); 332 return true; 333 } 334 335 bool TemplateURLRef::SupportsReplacement( 336 const SearchTermsData& search_terms_data) const { 337 ParseIfNecessary(search_terms_data); 338 return valid_ && supports_replacements_; 339 } 340 341 std::string TemplateURLRef::ReplaceSearchTerms( 342 const SearchTermsArgs& search_terms_args, 343 const SearchTermsData& search_terms_data, 344 PostContent* post_content) const { 345 ParseIfNecessary(search_terms_data); 346 if (!valid_) 347 return std::string(); 348 349 std::string url(HandleReplacements(search_terms_args, search_terms_data, 350 post_content)); 351 352 GURL gurl(url); 353 if (!gurl.is_valid()) 354 return url; 355 356 std::vector<std::string> query_params; 357 if (search_terms_args.append_extra_query_params) { 358 std::string extra_params( 359 CommandLine::ForCurrentProcess()->GetSwitchValueASCII( 360 switches::kExtraSearchQueryParams)); 361 if (!extra_params.empty()) 362 query_params.push_back(extra_params); 363 } 364 if (!search_terms_args.suggest_query_params.empty()) 365 query_params.push_back(search_terms_args.suggest_query_params); 366 if (!gurl.query().empty()) 367 query_params.push_back(gurl.query()); 368 369 if (query_params.empty()) 370 return url; 371 372 GURL::Replacements replacements; 373 std::string query_str = JoinString(query_params, "&"); 374 replacements.SetQueryStr(query_str); 375 return gurl.ReplaceComponents(replacements).possibly_invalid_spec(); 376 } 377 378 bool TemplateURLRef::IsValid(const SearchTermsData& search_terms_data) const { 379 ParseIfNecessary(search_terms_data); 380 return valid_; 381 } 382 383 
base::string16 TemplateURLRef::DisplayURL( 384 const SearchTermsData& search_terms_data) const { 385 ParseIfNecessary(search_terms_data); 386 base::string16 result(base::UTF8ToUTF16(GetURL())); 387 if (valid_ && !replacements_.empty()) { 388 ReplaceSubstringsAfterOffset(&result, 0, 389 base::ASCIIToUTF16(kSearchTermsParameterFull), 390 base::ASCIIToUTF16(kDisplaySearchTerms)); 391 ReplaceSubstringsAfterOffset(&result, 0, 392 base::ASCIIToUTF16(kGoogleUnescapedSearchTermsParameterFull), 393 base::ASCIIToUTF16(kDisplayUnescapedSearchTerms)); 394 } 395 return result; 396 } 397 398 // static 399 std::string TemplateURLRef::DisplayURLToURLRef( 400 const base::string16& display_url) { 401 base::string16 result = display_url; 402 ReplaceSubstringsAfterOffset(&result, 0, 403 base::ASCIIToUTF16(kDisplaySearchTerms), 404 base::ASCIIToUTF16(kSearchTermsParameterFull)); 405 ReplaceSubstringsAfterOffset( 406 &result, 0, 407 base::ASCIIToUTF16(kDisplayUnescapedSearchTerms), 408 base::ASCIIToUTF16(kGoogleUnescapedSearchTermsParameterFull)); 409 return base::UTF16ToUTF8(result); 410 } 411 412 const std::string& TemplateURLRef::GetHost( 413 const SearchTermsData& search_terms_data) const { 414 ParseIfNecessary(search_terms_data); 415 return host_; 416 } 417 418 const std::string& TemplateURLRef::GetPath( 419 const SearchTermsData& search_terms_data) const { 420 ParseIfNecessary(search_terms_data); 421 return path_; 422 } 423 424 const std::string& TemplateURLRef::GetSearchTermKey( 425 const SearchTermsData& search_terms_data) const { 426 ParseIfNecessary(search_terms_data); 427 return search_term_key_; 428 } 429 430 base::string16 TemplateURLRef::SearchTermToString16( 431 const std::string& term) const { 432 const std::vector<std::string>& encodings = owner_->input_encodings(); 433 base::string16 result; 434 435 std::string unescaped = net::UnescapeURLComponent( 436 term, 437 net::UnescapeRule::REPLACE_PLUS_WITH_SPACE | 438 net::UnescapeRule::URL_SPECIAL_CHARS); 439 for (size_t i = 
0; i < encodings.size(); ++i) { 440 if (base::CodepageToUTF16(unescaped, encodings[i].c_str(), 441 base::OnStringConversionError::FAIL, &result)) 442 return result; 443 } 444 445 // Always fall back on UTF-8 if it works. 446 if (base::CodepageToUTF16(unescaped, base::kCodepageUTF8, 447 base::OnStringConversionError::FAIL, &result)) 448 return result; 449 450 // When nothing worked, just use the escaped text. We have no idea what the 451 // encoding is. We need to substitute spaces for pluses ourselves since we're 452 // not sending it through an unescaper. 453 result = base::UTF8ToUTF16(term); 454 std::replace(result.begin(), result.end(), '+', ' '); 455 return result; 456 } 457 458 bool TemplateURLRef::HasGoogleBaseURLs( 459 const SearchTermsData& search_terms_data) const { 460 ParseIfNecessary(search_terms_data); 461 for (size_t i = 0; i < replacements_.size(); ++i) { 462 if ((replacements_[i].type == GOOGLE_BASE_URL) || 463 (replacements_[i].type == GOOGLE_BASE_SUGGEST_URL)) 464 return true; 465 } 466 return false; 467 } 468 469 bool TemplateURLRef::ExtractSearchTermsFromURL( 470 const GURL& url, 471 base::string16* search_terms, 472 const SearchTermsData& search_terms_data, 473 url::Parsed::ComponentType* search_terms_component, 474 url::Component* search_terms_position) const { 475 DCHECK(search_terms); 476 search_terms->clear(); 477 478 ParseIfNecessary(search_terms_data); 479 480 // We need a search term in the template URL to extract something. 481 if (search_term_key_.empty()) 482 return false; 483 484 // TODO(beaudoin): Support patterns of the form http://foo/{searchTerms}/ 485 // See crbug.com/153798 486 487 // Fill-in the replacements. We don't care about search terms in the pattern, 488 // so we use the empty string. 489 // Currently we assume the search term only shows in URL, not in post params. 490 GURL pattern(ReplaceSearchTerms(SearchTermsArgs(base::string16()), 491 search_terms_data, NULL)); 492 // Host, path and port must match. 
493 if (url.port() != pattern.port() || 494 url.host() != host_ || 495 url.path() != path_) { 496 return false; 497 } 498 499 // Parameter must be present either in the query or the ref. 500 const std::string& params( 501 (search_term_key_location_ == url::Parsed::QUERY) ? 502 url.query() : url.ref()); 503 504 url::Component query, key, value; 505 query.len = static_cast<int>(params.size()); 506 bool key_found = false; 507 while (url::ExtractQueryKeyValue(params.c_str(), &query, &key, &value)) { 508 if (key.is_nonempty()) { 509 if (params.substr(key.begin, key.len) == search_term_key_) { 510 // Fail if search term key is found twice. 511 if (key_found) { 512 search_terms->clear(); 513 return false; 514 } 515 key_found = true; 516 // Extract the search term. 517 *search_terms = net::UnescapeAndDecodeUTF8URLComponent( 518 params.substr(value.begin, value.len), 519 net::UnescapeRule::SPACES | 520 net::UnescapeRule::URL_SPECIAL_CHARS | 521 net::UnescapeRule::REPLACE_PLUS_WITH_SPACE); 522 if (search_terms_component) 523 *search_terms_component = search_term_key_location_; 524 if (search_terms_position) 525 *search_terms_position = value; 526 } 527 } 528 } 529 return key_found; 530 } 531 532 void TemplateURLRef::InvalidateCachedValues() const { 533 supports_replacements_ = valid_ = parsed_ = false; 534 host_.clear(); 535 path_.clear(); 536 search_term_key_.clear(); 537 replacements_.clear(); 538 post_params_.clear(); 539 } 540 541 bool TemplateURLRef::ParseParameter(size_t start, 542 size_t end, 543 std::string* url, 544 Replacements* replacements) const { 545 DCHECK(start != std::string::npos && 546 end != std::string::npos && end > start); 547 size_t length = end - start - 1; 548 bool optional = false; 549 if ((*url)[end - 1] == kOptional) { 550 optional = true; 551 length--; 552 } 553 std::string parameter(url->substr(start + 1, length)); 554 std::string full_parameter(url->substr(start, end - start + 1)); 555 // Remove the parameter from the string. 
For parameters who replacement is 556 // constant and already known, just replace them directly. For other cases, 557 // like parameters whose values may change over time, use |replacements|. 558 url->erase(start, end - start + 1); 559 if (parameter == kSearchTermsParameter) { 560 replacements->push_back(Replacement(SEARCH_TERMS, start)); 561 } else if (parameter == kCountParameter) { 562 if (!optional) 563 url->insert(start, kDefaultCount); 564 } else if (parameter == kGoogleAssistedQueryStatsParameter) { 565 replacements->push_back(Replacement(GOOGLE_ASSISTED_QUERY_STATS, start)); 566 } else if (parameter == kGoogleBaseURLParameter) { 567 replacements->push_back(Replacement(GOOGLE_BASE_URL, start)); 568 } else if (parameter == kGoogleBaseSuggestURLParameter) { 569 replacements->push_back(Replacement(GOOGLE_BASE_SUGGEST_URL, start)); 570 } else if (parameter == kGoogleBookmarkBarPinnedParameter) { 571 replacements->push_back(Replacement(GOOGLE_BOOKMARK_BAR_PINNED, start)); 572 } else if (parameter == kGoogleCurrentPageUrlParameter) { 573 replacements->push_back(Replacement(GOOGLE_CURRENT_PAGE_URL, start)); 574 } else if (parameter == kGoogleCursorPositionParameter) { 575 replacements->push_back(Replacement(GOOGLE_CURSOR_POSITION, start)); 576 } else if (parameter == kGoogleForceInstantResultsParameter) { 577 replacements->push_back(Replacement(GOOGLE_FORCE_INSTANT_RESULTS, start)); 578 } else if (parameter == kGoogleImageOriginalHeight) { 579 replacements->push_back( 580 Replacement(TemplateURLRef::GOOGLE_IMAGE_ORIGINAL_HEIGHT, start)); 581 } else if (parameter == kGoogleImageOriginalWidth) { 582 replacements->push_back( 583 Replacement(TemplateURLRef::GOOGLE_IMAGE_ORIGINAL_WIDTH, start)); 584 } else if (parameter == kGoogleImageSearchSource) { 585 replacements->push_back( 586 Replacement(TemplateURLRef::GOOGLE_IMAGE_SEARCH_SOURCE, start)); 587 } else if (parameter == kGoogleImageThumbnailParameter) { 588 replacements->push_back( 589 
Replacement(TemplateURLRef::GOOGLE_IMAGE_THUMBNAIL, start)); 590 } else if (parameter == kGoogleImageURLParameter) { 591 replacements->push_back(Replacement(TemplateURLRef::GOOGLE_IMAGE_URL, 592 start)); 593 } else if (parameter == kGoogleInputTypeParameter) { 594 replacements->push_back(Replacement(TemplateURLRef::GOOGLE_INPUT_TYPE, 595 start)); 596 } else if (parameter == kGoogleInstantExtendedEnabledParameter) { 597 replacements->push_back(Replacement(GOOGLE_INSTANT_EXTENDED_ENABLED, 598 start)); 599 } else if (parameter == kGoogleInstantExtendedEnabledKey) { 600 url->insert(start, google_util::kInstantExtendedAPIParam); 601 } else if (parameter == kGoogleNTPIsThemedParameter) { 602 replacements->push_back(Replacement(GOOGLE_NTP_IS_THEMED, start)); 603 } else if (parameter == kGoogleOmniboxStartMarginParameter) { 604 replacements->push_back(Replacement(GOOGLE_OMNIBOX_START_MARGIN, start)); 605 } else if (parameter == kGoogleContextualSearchVersion) { 606 replacements->push_back( 607 Replacement(GOOGLE_CONTEXTUAL_SEARCH_VERSION, start)); 608 } else if (parameter == kGoogleContextualSearchContextData) { 609 replacements->push_back( 610 Replacement(GOOGLE_CONTEXTUAL_SEARCH_CONTEXT_DATA, start)); 611 } else if (parameter == kGoogleOriginalQueryForSuggestionParameter) { 612 replacements->push_back(Replacement(GOOGLE_ORIGINAL_QUERY_FOR_SUGGESTION, 613 start)); 614 } else if (parameter == kGooglePageClassificationParameter) { 615 replacements->push_back(Replacement(GOOGLE_PAGE_CLASSIFICATION, start)); 616 } else if (parameter == kGooglePrefetchQuery) { 617 replacements->push_back(Replacement(GOOGLE_PREFETCH_QUERY, start)); 618 } else if (parameter == kGoogleRLZParameter) { 619 replacements->push_back(Replacement(GOOGLE_RLZ, start)); 620 } else if (parameter == kGoogleSearchClient) { 621 replacements->push_back(Replacement(GOOGLE_SEARCH_CLIENT, start)); 622 } else if (parameter == kGoogleSearchFieldtrialParameter) { 623 
replacements->push_back(Replacement(GOOGLE_SEARCH_FIELDTRIAL_GROUP, start)); 624 } else if (parameter == kGoogleSearchVersion) { 625 replacements->push_back(Replacement(GOOGLE_SEARCH_VERSION, start)); 626 } else if (parameter == kGoogleSessionToken) { 627 replacements->push_back(Replacement(GOOGLE_SESSION_TOKEN, start)); 628 } else if (parameter == kGoogleSourceIdParameter) { 629 #if defined(OS_ANDROID) 630 url->insert(start, "sourceid=chrome-mobile&"); 631 #else 632 url->insert(start, "sourceid=chrome&"); 633 #endif 634 } else if (parameter == kGoogleSuggestAPIKeyParameter) { 635 url->insert(start, 636 net::EscapeQueryParamValue(google_apis::GetAPIKey(), false)); 637 } else if (parameter == kGoogleSuggestClient) { 638 replacements->push_back(Replacement(GOOGLE_SUGGEST_CLIENT, start)); 639 } else if (parameter == kGoogleSuggestRequestId) { 640 replacements->push_back(Replacement(GOOGLE_SUGGEST_REQUEST_ID, start)); 641 } else if (parameter == kGoogleUnescapedSearchTermsParameter) { 642 replacements->push_back(Replacement(GOOGLE_UNESCAPED_SEARCH_TERMS, start)); 643 } else if (parameter == kInputEncodingParameter) { 644 replacements->push_back(Replacement(ENCODING, start)); 645 } else if (parameter == kLanguageParameter) { 646 replacements->push_back(Replacement(LANGUAGE, start)); 647 } else if (parameter == kOutputEncodingParameter) { 648 if (!optional) 649 url->insert(start, kOutputEncodingType); 650 } else if ((parameter == kStartIndexParameter) || 651 (parameter == kStartPageParameter)) { 652 // We don't support these. 653 if (!optional) 654 url->insert(start, "1"); 655 } else if (!prepopulated_) { 656 // If it's a prepopulated URL, we know that it's safe to remove unknown 657 // parameters, so just ignore this and return true below. Otherwise it could 658 // be some garbage but can also be a javascript block. Put it back. 
659 url->insert(start, full_parameter); 660 return false; 661 } 662 return true; 663 } 664 665 std::string TemplateURLRef::ParseURL(const std::string& url, 666 Replacements* replacements, 667 PostParams* post_params, 668 bool* valid) const { 669 *valid = false; 670 std::string parsed_url = url; 671 for (size_t last = 0; last != std::string::npos; ) { 672 last = parsed_url.find(kStartParameter, last); 673 if (last != std::string::npos) { 674 size_t template_end = parsed_url.find(kEndParameter, last); 675 if (template_end != std::string::npos) { 676 // Since we allow Javascript in the URL, {} pairs could be nested. Match 677 // only leaf pairs with supported parameters. 678 size_t next_template_start = parsed_url.find(kStartParameter, last + 1); 679 if (next_template_start == std::string::npos || 680 next_template_start > template_end) { 681 // If successful, ParseParameter erases from the string as such no 682 // need to update |last|. If failed, move |last| to the end of pair. 683 if (!ParseParameter(last, template_end, &parsed_url, replacements)) { 684 // |template_end| + 1 may be beyond the end of the string. 685 last = template_end; 686 } 687 } else { 688 last = next_template_start; 689 } 690 } else { 691 // Open brace without a closing brace, return. 692 return std::string(); 693 } 694 } 695 } 696 697 // Handles the post parameters. 698 const std::string& post_params_string = GetPostParamsString(); 699 if (!post_params_string.empty()) { 700 typedef std::vector<std::string> Strings; 701 Strings param_list; 702 base::SplitString(post_params_string, ',', ¶m_list); 703 704 for (Strings::const_iterator iterator = param_list.begin(); 705 iterator != param_list.end(); ++iterator) { 706 Strings parts; 707 // The '=' delimiter is required and the name must be not empty. 
708 base::SplitString(*iterator, '=', &parts); 709 if ((parts.size() != 2U) || parts[0].empty()) 710 return std::string(); 711 712 std::string& value = parts[1]; 713 size_t replacements_size = replacements->size(); 714 if (IsTemplateParameterString(value)) 715 ParseParameter(0, value.length() - 1, &value, replacements); 716 post_params->push_back(std::make_pair(parts[0], value)); 717 // If there was a replacement added, points its index to last added 718 // PostParam. 719 if (replacements->size() > replacements_size) { 720 DCHECK_EQ(replacements_size + 1, replacements->size()); 721 Replacement* r = &replacements->back(); 722 r->is_post_param = true; 723 r->index = post_params->size() - 1; 724 } 725 } 726 DCHECK(!post_params->empty()); 727 } 728 729 *valid = true; 730 return parsed_url; 731 } 732 733 void TemplateURLRef::ParseIfNecessary( 734 const SearchTermsData& search_terms_data) const { 735 if (!parsed_) { 736 InvalidateCachedValues(); 737 parsed_ = true; 738 parsed_url_ = ParseURL(GetURL(), &replacements_, &post_params_, &valid_); 739 supports_replacements_ = false; 740 if (valid_) { 741 bool has_only_one_search_term = false; 742 for (Replacements::const_iterator i = replacements_.begin(); 743 i != replacements_.end(); ++i) { 744 if ((i->type == SEARCH_TERMS) || 745 (i->type == GOOGLE_UNESCAPED_SEARCH_TERMS)) { 746 if (has_only_one_search_term) { 747 has_only_one_search_term = false; 748 break; 749 } 750 has_only_one_search_term = true; 751 supports_replacements_ = true; 752 } 753 } 754 // Only parse the host/key if there is one search term. Technically there 755 // could be more than one term, but it's uncommon; so we punt. 
756 if (has_only_one_search_term) 757 ParseHostAndSearchTermKey(search_terms_data); 758 } 759 } 760 } 761 762 void TemplateURLRef::ParseHostAndSearchTermKey( 763 const SearchTermsData& search_terms_data) const { 764 std::string url_string(GetURL()); 765 ReplaceSubstringsAfterOffset(&url_string, 0, 766 kGoogleBaseURLParameterFull, 767 search_terms_data.GoogleBaseURLValue()); 768 ReplaceSubstringsAfterOffset(&url_string, 0, 769 kGoogleBaseSuggestURLParameterFull, 770 search_terms_data.GoogleBaseSuggestURLValue()); 771 772 search_term_key_.clear(); 773 host_.clear(); 774 path_.clear(); 775 search_term_key_location_ = url::Parsed::REF; 776 777 GURL url(url_string); 778 if (!url.is_valid()) 779 return; 780 781 std::string query_key = FindSearchTermsKey(url.query()); 782 std::string ref_key = FindSearchTermsKey(url.ref()); 783 if (query_key.empty() == ref_key.empty()) 784 return; // No key or multiple keys found. We only handle having one key. 785 search_term_key_ = query_key.empty() ? ref_key : query_key; 786 search_term_key_location_ = 787 query_key.empty() ? url::Parsed::REF : url::Parsed::QUERY; 788 host_ = url.host(); 789 path_ = url.path(); 790 } 791 792 void TemplateURLRef::HandleReplacement(const std::string& name, 793 const std::string& value, 794 const Replacement& replacement, 795 std::string* url) const { 796 size_t pos = replacement.index; 797 if (replacement.is_post_param) { 798 DCHECK_LT(pos, post_params_.size()); 799 DCHECK(!post_params_[pos].first.empty()); 800 post_params_[pos].second = value; 801 } else { 802 url->insert(pos, name.empty() ? 
value : (name + "=" + value + "&"));
  }
}

// Produces the final URL string by substituting every entry of
// |replacements_| into a copy of |parsed_url_|.
//
// |search_terms_args| supplies the per-request values (search terms, AQS,
// cursor position, image data, ...), |search_terms_data| supplies the
// environment values (Google base URL, locale, RLZ, ...). When
// |post_params_| is non-empty, the POST parameters are encoded into
// |post_content| via EncodeFormData(). Returns the substituted URL; when
// there are no replacements at all, |parsed_url_| is returned unchanged.
std::string TemplateURLRef::HandleReplacements(
    const SearchTermsArgs& search_terms_args,
    const SearchTermsData& search_terms_data,
    PostContent* post_content) const {
  // Fast path: nothing to substitute in the URL itself.
  if (replacements_.empty()) {
    if (!post_params_.empty())
      EncodeFormData(post_params_, post_content);
    return parsed_url_;
  }

  // Determine if the search terms are in the query or before. We're escaping
  // space as '+' in the former case and as '%20' in the latter case.
  // Only the first SEARCH_TERMS replacement is inspected; if there is none,
  // |is_in_query| keeps its default of true.
  bool is_in_query = true;
  for (Replacements::iterator i = replacements_.begin();
       i != replacements_.end(); ++i) {
    if (i->type == SEARCH_TERMS) {
      base::string16::size_type query_start = parsed_url_.find('?');
      is_in_query = query_start != base::string16::npos &&
          (static_cast<base::string16::size_type>(i->index) > query_start);
      break;
    }
  }

  // Encode the search terms (and the original query) once, up front; the
  // encoding that was chosen is reported back in |input_encoding|.
  std::string input_encoding;
  base::string16 encoded_terms;
  base::string16 encoded_original_query;
  owner_->EncodeSearchTerms(search_terms_args, is_in_query, &input_encoding,
                            &encoded_terms, &encoded_original_query);

  std::string url = parsed_url_;

  // replacements_ is ordered in ascending order, as such we need to iterate
  // from the back. (Inserting at a later index first keeps the earlier
  // indices valid.)
  for (Replacements::reverse_iterator i = replacements_.rbegin();
       i != replacements_.rend(); ++i) {
    switch (i->type) {
      case ENCODING:
        HandleReplacement(std::string(), input_encoding, *i, &url);
        break;

      case GOOGLE_ASSISTED_QUERY_STATS:
        DCHECK(!i->is_post_param);
        if (!search_terms_args.assisted_query_stats.empty()) {
          // Get the base URL without substituting AQS to avoid infinite
          // recursion.  We need the URL to find out if it meets all
          // AQS requirements (e.g. HTTPS protocol check).
          // See TemplateURLRef::SearchTermsArgs for more details.
          SearchTermsArgs search_terms_args_without_aqs(search_terms_args);
          search_terms_args_without_aqs.assisted_query_stats.clear();
          GURL base_url(ReplaceSearchTerms(
              search_terms_args_without_aqs, search_terms_data, NULL));
          if (base_url.SchemeIs(url::kHttpsScheme)) {
            HandleReplacement(
                "aqs", search_terms_args.assisted_query_stats, *i, &url);
          }
        }
        break;

      case GOOGLE_BASE_URL:
        DCHECK(!i->is_post_param);
        HandleReplacement(
            std::string(), search_terms_data.GoogleBaseURLValue(), *i, &url);
        break;

      case GOOGLE_BASE_SUGGEST_URL:
        DCHECK(!i->is_post_param);
        HandleReplacement(
            std::string(), search_terms_data.GoogleBaseSuggestURLValue(), *i,
            &url);
        break;

      case GOOGLE_BOOKMARK_BAR_PINNED:
        if (search_terms_data.IsShowingSearchTermsOnSearchResultsPages()) {
          // Log whether the bookmark bar is pinned when the user is seeing
          // InstantExtended on the SRP.
          DCHECK(!i->is_post_param);
          HandleReplacement(
              "bmbp", search_terms_args.bookmark_bar_pinned ? "1" : "0", *i,
              &url);
        }
        break;

      case GOOGLE_CURRENT_PAGE_URL:
        DCHECK(!i->is_post_param);
        if (!search_terms_args.current_page_url.empty()) {
          // The page URL is escaped before being embedded as a query value.
          const std::string& escaped_current_page_url =
              net::EscapeQueryParamValue(search_terms_args.current_page_url,
                                         true);
          HandleReplacement("url", escaped_current_page_url, *i, &url);
        }
        break;

      case GOOGLE_CURSOR_POSITION:
        DCHECK(!i->is_post_param);
        // npos means "no cursor position"; the parameter is then omitted.
        if (search_terms_args.cursor_position != base::string16::npos)
          HandleReplacement(
              "cp",
              base::StringPrintf("%" PRIuS, search_terms_args.cursor_position),
              *i,
              &url);
        break;

      case GOOGLE_FORCE_INSTANT_RESULTS:
        DCHECK(!i->is_post_param);
        HandleReplacement(std::string(),
                          search_terms_data.ForceInstantResultsParam(
                              search_terms_args.force_instant_results),
                          *i,
                          &url);
        break;

      case GOOGLE_INPUT_TYPE:
        DCHECK(!i->is_post_param);
        HandleReplacement(
            "oit", base::IntToString(search_terms_args.input_type), *i, &url);
        break;

      case GOOGLE_INSTANT_EXTENDED_ENABLED:
        DCHECK(!i->is_post_param);
        HandleReplacement(std::string(),
                          search_terms_data.InstantExtendedEnabledParam(
                              type_ == SEARCH),
                          *i,
                          &url);
        break;

      case GOOGLE_NTP_IS_THEMED:
        DCHECK(!i->is_post_param);
        HandleReplacement(
            std::string(), search_terms_data.NTPIsThemedParam(), *i, &url);
        break;

      case GOOGLE_OMNIBOX_START_MARGIN:
        DCHECK(!i->is_post_param);
        if (search_terms_args.enable_omnibox_start_margin) {
          // A negative margin is skipped rather than emitted.
          int omnibox_start_margin = search_terms_data.OmniboxStartMargin();
          if (omnibox_start_margin >= 0) {
            HandleReplacement("es_sm", base::IntToString(omnibox_start_margin),
                              *i, &url);
          }
        }
        break;

      case GOOGLE_CONTEXTUAL_SEARCH_VERSION:
        if (search_terms_args.contextual_search_params.version >= 0) {
          HandleReplacement(
              "ctxs",
              base::IntToString(
                  search_terms_args.contextual_search_params.version),
              *i,
              &url);
        }
        break;

      case GOOGLE_CONTEXTUAL_SEARCH_CONTEXT_DATA: {
        DCHECK(!i->is_post_param);
        // Assemble a "key=value&..." fragment from whichever contextual
        // search fields are set; the resolve flag is always appended last.
        std::string context_data;

        const SearchTermsArgs::ContextualSearchParams& params =
            search_terms_args.contextual_search_params;

        // NOTE(review): |start| / |end| are compared against
        // std::string::npos but formatted with IntToString -- confirm the
        // declared type and that large values cannot be truncated.
        if (params.start != std::string::npos) {
          context_data.append("ctxs_start=" + base::IntToString(
              params.start) + "&");
        }

        if (params.end != std::string::npos) {
          context_data.append("ctxs_end=" + base::IntToString(
              params.end) + "&");
        }

        // NOTE(review): the string fields below are appended without any
        // escaping here -- presumably the caller has already escaped them;
        // verify.
        if (!params.selection.empty())
          context_data.append("q=" + params.selection + "&");

        if (!params.content.empty())
          context_data.append("ctxs_content=" + params.content + "&");

        if (!params.base_page_url.empty())
          context_data.append("ctxsl_url=" + params.base_page_url + "&");

        if (!params.encoding.empty()) {
          context_data.append("ctxs_encoding=" + params.encoding + "&");
        }

        context_data.append(
            params.resolve ? "ctxsl_resolve=1" : "ctxsl_resolve=0");

        HandleReplacement(std::string(), context_data, *i, &url);
        break;
      }

      case GOOGLE_ORIGINAL_QUERY_FOR_SUGGESTION:
        DCHECK(!i->is_post_param);
        // Emitted only when a suggestion was accepted or AQS is present.
        if (search_terms_args.accepted_suggestion >= 0 ||
            !search_terms_args.assisted_query_stats.empty()) {
          HandleReplacement(
              "oq", base::UTF16ToUTF8(encoded_original_query), *i, &url);
        }
        break;

      case GOOGLE_PAGE_CLASSIFICATION:
        if (search_terms_args.page_classification !=
            metrics::OmniboxEventProto::INVALID_SPEC) {
          HandleReplacement(
              "pgcl", base::IntToString(search_terms_args.page_classification),
              *i, &url);
        }
        break;

      case GOOGLE_PREFETCH_QUERY: {
        // Both the query and its type must be present for either to be sent.
        const std::string& query = search_terms_args.prefetch_query;
        const std::string& type = search_terms_args.prefetch_query_type;
        if (!query.empty() && !type.empty()) {
          HandleReplacement(
              std::string(), "pfq=" + query + "&qha=" + type + "&", *i, &url);
        }
        break;
      }

      case GOOGLE_RLZ: {
        DCHECK(!i->is_post_param);
        // On platforms that don't have RLZ, we still want this branch
        // to happen so that we replace the RLZ template with the
        // empty string.  (If we don't handle this case, we hit a
        // NOTREACHED below.)
        base::string16 rlz_string = search_terms_data.GetRlzParameterValue(
            search_terms_args.from_app_list);
        if (!rlz_string.empty()) {
          HandleReplacement("rlz", base::UTF16ToUTF8(rlz_string), *i, &url);
        }
        break;
      }

      case GOOGLE_SEARCH_CLIENT: {
        DCHECK(!i->is_post_param);
        std::string client = search_terms_data.GetSearchClient();
        if (!client.empty())
          HandleReplacement("client", client, *i, &url);
        break;
      }

      case GOOGLE_SEARCH_FIELDTRIAL_GROUP:
        // We are not currently running any fieldtrials that modulate the search
        // url.  If we do, then we'd have some conditional insert such as:
        // url.insert(i->index, used_www ? "gcx=w&" : "gcx=c&");
        break;

      case GOOGLE_SEARCH_VERSION:
        if (search_terms_data.EnableAnswersInSuggest())
          HandleReplacement("gs_rn", "42", *i, &url);
        break;

      case GOOGLE_SESSION_TOKEN: {
        std::string token = search_terms_args.session_token;
        if (!token.empty())
          HandleReplacement("psi", token, *i, &url);
        break;
      }

      case GOOGLE_SUGGEST_CLIENT:
        HandleReplacement(
            std::string(), search_terms_data.GetSuggestClient(), *i, &url);
        break;

      case GOOGLE_SUGGEST_REQUEST_ID:
        HandleReplacement(
            std::string(), search_terms_data.GetSuggestRequestIdentifier(), *i,
            &url);
        break;

      case GOOGLE_UNESCAPED_SEARCH_TERMS: {
        // Converts the raw search terms to |input_encoding| without URL
        // escaping; characters that cannot be converted are skipped.
        std::string unescaped_terms;
        base::UTF16ToCodepage(search_terms_args.search_terms,
                              input_encoding.c_str(),
                              base::OnStringConversionError::SKIP,
                              &unescaped_terms);
        HandleReplacement(std::string(), unescaped_terms, *i, &url);
        break;
      }

      case LANGUAGE:
        HandleReplacement(
            std::string(), search_terms_data.GetApplicationLocale(), *i, &url);
        break;

      case SEARCH_TERMS:
        HandleReplacement(
            std::string(), base::UTF16ToUTF8(encoded_terms), *i, &url);
        break;

      case GOOGLE_IMAGE_THUMBNAIL:
        HandleReplacement(
            std::string(), search_terms_args.image_thumbnail_content, *i, &url);
        break;

      case GOOGLE_IMAGE_URL:
        if (search_terms_args.image_url.is_valid()) {
          HandleReplacement(
              std::string(), search_terms_args.image_url.spec(), *i, &url);
        }
        break;

      case GOOGLE_IMAGE_ORIGINAL_WIDTH:
        if (!search_terms_args.image_original_size.IsEmpty()) {
          HandleReplacement(
              std::string(),
              base::IntToString(search_terms_args.image_original_size.width()),
              *i, &url);
        }
        break;

      case GOOGLE_IMAGE_ORIGINAL_HEIGHT:
        if (!search_terms_args.image_original_size.IsEmpty()) {
          HandleReplacement(
              std::string(),
              base::IntToString(search_terms_args.image_original_size.height()),
              *i, &url);
        }
        break;

      case GOOGLE_IMAGE_SEARCH_SOURCE:
        HandleReplacement(
            std::string(), search_terms_data.GoogleImageSearchSource(), *i,
            &url);
        break;

      default:
        NOTREACHED();
        break;
    }
  }

  // POST parameter values were filled in by HandleReplacement() above; encode
  // them now that all replacements have been processed.
  if (!post_params_.empty())
    EncodeFormData(post_params_, post_content);

  return url;
}


// TemplateURL ----------------------------------------------------------------

// Records the extension |type| and |extension_id|; |type| must not be NORMAL.
TemplateURL::AssociatedExtensionInfo::AssociatedExtensionInfo(
    Type type,
    const std::string& extension_id)
    : type(type),
      extension_id(extension_id),
      wants_to_be_default_engine(false) {
  DCHECK_NE(NORMAL, type);
}

TemplateURL::AssociatedExtensionInfo::~AssociatedExtensionInfo() {
}

// Copies |data| and creates one TemplateURLRef per URL kind (search, suggest,
// instant, image, new tab, contextual search), each pointing back at this
// object.
TemplateURL::TemplateURL(const TemplateURLData& data)
    : data_(data),
      url_ref_(this, TemplateURLRef::SEARCH),
      suggestions_url_ref_(this,
                           TemplateURLRef::SUGGEST),
      instant_url_ref_(this,
                       TemplateURLRef::INSTANT),
      image_url_ref_(this, TemplateURLRef::IMAGE),
      new_tab_url_ref_(this, TemplateURLRef::NEW_TAB),
      contextual_search_url_ref_(this, TemplateURLRef::CONTEXTUAL_SEARCH) {
  SetPrepopulateId(data_.prepopulate_id);

  // A replacement key given as the placeholder is swapped for the concrete
  // Instant Extended API parameter name.
  if (data_.search_terms_replacement_key ==
      kGoogleInstantExtendedEnabledKeyFull) {
    data_.search_terms_replacement_key = google_util::kInstantExtendedAPIParam;
  }
}

TemplateURL::~TemplateURL() {
}

// static
base::string16 TemplateURL::GenerateKeyword(const GURL& url) {
  DCHECK(url.is_valid());
  // Strip "www." off the front of the keyword; otherwise the keyword won't work
  // properly.
See http://code.google.com/p/chromium/issues/detail?id=6984 . 1185 // Special case: if the host was exactly "www." (not sure this can happen but 1186 // perhaps with some weird intranet and custom DNS server?), ensure we at 1187 // least don't return the empty string. 1188 base::string16 keyword(net::StripWWWFromHost(url)); 1189 return keyword.empty() ? base::ASCIIToUTF16("www") : keyword; 1190 } 1191 1192 // static 1193 GURL TemplateURL::GenerateFaviconURL(const GURL& url) { 1194 DCHECK(url.is_valid()); 1195 GURL::Replacements rep; 1196 1197 const char favicon_path[] = "/favicon.ico"; 1198 int favicon_path_len = arraysize(favicon_path) - 1; 1199 1200 rep.SetPath(favicon_path, url::Component(0, favicon_path_len)); 1201 rep.ClearUsername(); 1202 rep.ClearPassword(); 1203 rep.ClearQuery(); 1204 rep.ClearRef(); 1205 return url.ReplaceComponents(rep); 1206 } 1207 1208 // static 1209 bool TemplateURL::MatchesData(const TemplateURL* t_url, 1210 const TemplateURLData* data, 1211 const SearchTermsData& search_terms_data) { 1212 if (!t_url || !data) 1213 return !t_url && !data; 1214 1215 return (t_url->short_name() == data->short_name) && 1216 t_url->HasSameKeywordAs(*data, search_terms_data) && 1217 (t_url->url() == data->url()) && 1218 (t_url->suggestions_url() == data->suggestions_url) && 1219 (t_url->instant_url() == data->instant_url) && 1220 (t_url->image_url() == data->image_url) && 1221 (t_url->new_tab_url() == data->new_tab_url) && 1222 (t_url->search_url_post_params() == data->search_url_post_params) && 1223 (t_url->suggestions_url_post_params() == 1224 data->suggestions_url_post_params) && 1225 (t_url->instant_url_post_params() == data->instant_url_post_params) && 1226 (t_url->image_url_post_params() == data->image_url_post_params) && 1227 (t_url->favicon_url() == data->favicon_url) && 1228 (t_url->safe_for_autoreplace() == data->safe_for_autoreplace) && 1229 (t_url->show_in_default_list() == data->show_in_default_list) && 1230 (t_url->input_encodings() == 
data->input_encodings) && 1231 (t_url->alternate_urls() == data->alternate_urls) && 1232 (t_url->search_terms_replacement_key() == 1233 data->search_terms_replacement_key); 1234 } 1235 1236 base::string16 TemplateURL::AdjustedShortNameForLocaleDirection() const { 1237 base::string16 bidi_safe_short_name = data_.short_name; 1238 base::i18n::AdjustStringForLocaleDirection(&bidi_safe_short_name); 1239 return bidi_safe_short_name; 1240 } 1241 1242 bool TemplateURL::ShowInDefaultList( 1243 const SearchTermsData& search_terms_data) const { 1244 return data_.show_in_default_list && 1245 url_ref_.SupportsReplacement(search_terms_data); 1246 } 1247 1248 bool TemplateURL::SupportsReplacement( 1249 const SearchTermsData& search_terms_data) const { 1250 return url_ref_.SupportsReplacement(search_terms_data); 1251 } 1252 1253 bool TemplateURL::HasGoogleBaseURLs( 1254 const SearchTermsData& search_terms_data) const { 1255 return url_ref_.HasGoogleBaseURLs(search_terms_data) || 1256 suggestions_url_ref_.HasGoogleBaseURLs(search_terms_data) || 1257 instant_url_ref_.HasGoogleBaseURLs(search_terms_data) || 1258 image_url_ref_.HasGoogleBaseURLs(search_terms_data) || 1259 new_tab_url_ref_.HasGoogleBaseURLs(search_terms_data); 1260 } 1261 1262 bool TemplateURL::IsGoogleSearchURLWithReplaceableKeyword( 1263 const SearchTermsData& search_terms_data) const { 1264 return (GetType() == NORMAL) && 1265 url_ref_.HasGoogleBaseURLs(search_terms_data) && 1266 google_util::IsGoogleHostname(base::UTF16ToUTF8(data_.keyword()), 1267 google_util::DISALLOW_SUBDOMAIN); 1268 } 1269 1270 bool TemplateURL::HasSameKeywordAs( 1271 const TemplateURLData& other, 1272 const SearchTermsData& search_terms_data) const { 1273 return (data_.keyword() == other.keyword()) || 1274 (IsGoogleSearchURLWithReplaceableKeyword(search_terms_data) && 1275 TemplateURL(other).IsGoogleSearchURLWithReplaceableKeyword( 1276 search_terms_data)); 1277 } 1278 1279 TemplateURL::Type TemplateURL::GetType() const { 1280 return 
extension_info_ ? extension_info_->type : NORMAL; 1281 } 1282 1283 std::string TemplateURL::GetExtensionId() const { 1284 DCHECK(extension_info_); 1285 return extension_info_->extension_id; 1286 } 1287 1288 size_t TemplateURL::URLCount() const { 1289 // Add 1 for the regular search URL. 1290 return data_.alternate_urls.size() + 1; 1291 } 1292 1293 const std::string& TemplateURL::GetURL(size_t index) const { 1294 DCHECK_LT(index, URLCount()); 1295 1296 return (index < data_.alternate_urls.size()) ? 1297 data_.alternate_urls[index] : url(); 1298 } 1299 1300 bool TemplateURL::ExtractSearchTermsFromURL( 1301 const GURL& url, 1302 const SearchTermsData& search_terms_data, 1303 base::string16* search_terms) { 1304 return FindSearchTermsInURL(url, search_terms_data, search_terms, NULL, NULL); 1305 } 1306 1307 bool TemplateURL::IsSearchURL( 1308 const GURL& url, 1309 const SearchTermsData& search_terms_data) { 1310 base::string16 search_terms; 1311 return ExtractSearchTermsFromURL(url, search_terms_data, &search_terms) && 1312 !search_terms.empty(); 1313 } 1314 1315 bool TemplateURL::HasSearchTermsReplacementKey(const GURL& url) const { 1316 // Look for the key both in the query and the ref. 1317 std::string params[] = {url.query(), url.ref()}; 1318 1319 for (int i = 0; i < 2; ++i) { 1320 url::Component query, key, value; 1321 query.len = static_cast<int>(params[i].size()); 1322 while (url::ExtractQueryKeyValue(params[i].c_str(), &query, &key, &value)) { 1323 if (key.is_nonempty() && 1324 params[i].substr(key.begin, key.len) == 1325 search_terms_replacement_key()) { 1326 return true; 1327 } 1328 } 1329 } 1330 return false; 1331 } 1332 1333 bool TemplateURL::ReplaceSearchTermsInURL( 1334 const GURL& url, 1335 const TemplateURLRef::SearchTermsArgs& search_terms_args, 1336 const SearchTermsData& search_terms_data, 1337 GURL* result) { 1338 // TODO(beaudoin): Use AQS from |search_terms_args| too. 
1339 url::Parsed::ComponentType search_term_component; 1340 url::Component search_terms_position; 1341 base::string16 search_terms; 1342 if (!FindSearchTermsInURL(url, search_terms_data, &search_terms, 1343 &search_term_component, &search_terms_position)) { 1344 return false; 1345 } 1346 DCHECK(search_terms_position.is_nonempty()); 1347 1348 // FindSearchTermsInURL only returns true for search terms in the query or 1349 // ref, so we can call EncodeSearchTerm with |is_in_query| = true, since query 1350 // and ref are encoded in the same way. 1351 std::string input_encoding; 1352 base::string16 encoded_terms; 1353 base::string16 encoded_original_query; 1354 EncodeSearchTerms(search_terms_args, true, &input_encoding, 1355 &encoded_terms, &encoded_original_query); 1356 1357 std::string old_params( 1358 (search_term_component == url::Parsed::REF) ? url.ref() : url.query()); 1359 std::string new_params(old_params, 0, search_terms_position.begin); 1360 new_params += base::UTF16ToUTF8(search_terms_args.search_terms); 1361 new_params += old_params.substr(search_terms_position.end()); 1362 url::StdStringReplacements<std::string> replacements; 1363 if (search_term_component == url::Parsed::REF) 1364 replacements.SetRefStr(new_params); 1365 else 1366 replacements.SetQueryStr(new_params); 1367 *result = url.ReplaceComponents(replacements); 1368 return true; 1369 } 1370 1371 void TemplateURL::EncodeSearchTerms( 1372 const TemplateURLRef::SearchTermsArgs& search_terms_args, 1373 bool is_in_query, 1374 std::string* input_encoding, 1375 base::string16* encoded_terms, 1376 base::string16* encoded_original_query) const { 1377 1378 std::vector<std::string> encodings(input_encodings()); 1379 if (std::find(encodings.begin(), encodings.end(), "UTF-8") == encodings.end()) 1380 encodings.push_back("UTF-8"); 1381 for (std::vector<std::string>::const_iterator i(encodings.begin()); 1382 i != encodings.end(); ++i) { 1383 if (TryEncoding(search_terms_args.search_terms, 1384 
search_terms_args.original_query, i->c_str(), 1385 is_in_query, encoded_terms, encoded_original_query)) { 1386 *input_encoding = *i; 1387 return; 1388 } 1389 } 1390 NOTREACHED(); 1391 } 1392 1393 GURL TemplateURL::GenerateSearchURL( 1394 const SearchTermsData& search_terms_data) const { 1395 if (!url_ref_.IsValid(search_terms_data)) 1396 return GURL(); 1397 1398 if (!url_ref_.SupportsReplacement(search_terms_data)) 1399 return GURL(url()); 1400 1401 // Use something obscure for the search terms argument so that in the rare 1402 // case the term replaces the URL it's unlikely another keyword would have the 1403 // same url. 1404 // TODO(jnd): Add additional parameters to get post data when the search URL 1405 // has post parameters. 1406 return GURL(url_ref_.ReplaceSearchTerms( 1407 TemplateURLRef::SearchTermsArgs( 1408 base::ASCIIToUTF16("blah.blah.blah.blah.blah")), 1409 search_terms_data, NULL)); 1410 } 1411 1412 void TemplateURL::CopyFrom(const TemplateURL& other) { 1413 if (this == &other) 1414 return; 1415 1416 data_ = other.data_; 1417 url_ref_.InvalidateCachedValues(); 1418 suggestions_url_ref_.InvalidateCachedValues(); 1419 instant_url_ref_.InvalidateCachedValues(); 1420 SetPrepopulateId(other.data_.prepopulate_id); 1421 } 1422 1423 void TemplateURL::SetURL(const std::string& url) { 1424 data_.SetURL(url); 1425 url_ref_.InvalidateCachedValues(); 1426 } 1427 1428 void TemplateURL::SetPrepopulateId(int id) { 1429 data_.prepopulate_id = id; 1430 const bool prepopulated = id > 0; 1431 url_ref_.prepopulated_ = prepopulated; 1432 suggestions_url_ref_.prepopulated_ = prepopulated; 1433 instant_url_ref_.prepopulated_ = prepopulated; 1434 } 1435 1436 void TemplateURL::ResetKeywordIfNecessary( 1437 const SearchTermsData& search_terms_data, 1438 bool force) { 1439 if (IsGoogleSearchURLWithReplaceableKeyword(search_terms_data) || force) { 1440 DCHECK(GetType() != OMNIBOX_API_EXTENSION); 1441 GURL url(GenerateSearchURL(search_terms_data)); 1442 if (url.is_valid()) 1443 
data_.SetKeyword(GenerateKeyword(url)); 1444 } 1445 } 1446 1447 bool TemplateURL::FindSearchTermsInURL( 1448 const GURL& url, 1449 const SearchTermsData& search_terms_data, 1450 base::string16* search_terms, 1451 url::Parsed::ComponentType* search_term_component, 1452 url::Component* search_terms_position) { 1453 DCHECK(search_terms); 1454 search_terms->clear(); 1455 1456 // Try to match with every pattern. 1457 for (size_t i = 0; i < URLCount(); ++i) { 1458 TemplateURLRef ref(this, i); 1459 if (ref.ExtractSearchTermsFromURL(url, search_terms, search_terms_data, 1460 search_term_component, search_terms_position)) { 1461 // If ExtractSearchTermsFromURL() returns true and |search_terms| is empty 1462 // it means the pattern matched but no search terms were present. In this 1463 // case we fail immediately without looking for matches in subsequent 1464 // patterns. This means that given patterns 1465 // [ "http://foo/#q={searchTerms}", "http://foo/?q={searchTerms}" ], 1466 // calling ExtractSearchTermsFromURL() on "http://foo/?q=bar#q=' would 1467 // return false. This is important for at least Google, where such URLs 1468 // are invalid. 1469 return !search_terms->empty(); 1470 } 1471 } 1472 return false; 1473 } 1474