1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. 2 // Use of this source code is governed by a BSD-style license that can be 3 // found in the LICENSE file. 4 5 #include "chrome/browser/search_engines/template_url.h" 6 7 #include <string> 8 #include <vector> 9 10 #include "base/basictypes.h" 11 #include "base/command_line.h" 12 #include "base/format_macros.h" 13 #include "base/i18n/icu_string_conversions.h" 14 #include "base/i18n/rtl.h" 15 #include "base/logging.h" 16 #include "base/metrics/field_trial.h" 17 #include "base/rand_util.h" 18 #include "base/strings/string_number_conversions.h" 19 #include "base/strings/string_split.h" 20 #include "base/strings/string_util.h" 21 #include "base/strings/stringprintf.h" 22 #include "base/strings/utf_string_conversions.h" 23 #include "chrome/browser/omnibox/omnibox_field_trial.h" 24 #include "chrome/browser/search/search.h" 25 #include "chrome/common/chrome_switches.h" 26 #include "components/google/core/browser/google_util.h" 27 #include "components/metrics/proto/omnibox_input_type.pb.h" 28 #include "components/search_engines/search_terms_data.h" 29 #include "extensions/common/constants.h" 30 #include "google_apis/google_api_keys.h" 31 #include "net/base/escape.h" 32 #include "net/base/mime_util.h" 33 #include "net/base/net_util.h" 34 #include "ui/base/l10n/l10n_util.h" 35 36 namespace { 37 38 // The TemplateURLRef has any number of terms that need to be replaced. Each of 39 // the terms is enclosed in braces. If the character preceeding the final 40 // brace is a ?, it indicates the term is optional and can be replaced with 41 // an empty string. 42 const char kStartParameter = '{'; 43 const char kEndParameter = '}'; 44 const char kOptional = '?'; 45 46 // Known parameters found in the URL. 47 const char kSearchTermsParameter[] = "searchTerms"; 48 const char kSearchTermsParameterFull[] = "{searchTerms}"; 49 const char kCountParameter[] = "count"; 50 const char kStartIndexParameter[] = "startIndex"; 51 const char kStartPageParameter[] = "startPage"; 52 const char kLanguageParameter[] = "language"; 53 const char kInputEncodingParameter[] = "inputEncoding"; 54 const char kOutputEncodingParameter[] = "outputEncoding"; 55 56 const char kGoogleAssistedQueryStatsParameter[] = "google:assistedQueryStats"; 57 58 // Host/Domain Google searches are relative to. 59 const char kGoogleBaseURLParameter[] = "google:baseURL"; 60 const char kGoogleBaseURLParameterFull[] = "{google:baseURL}"; 61 62 // Like google:baseURL, but for the Search Suggest capability. 63 const char kGoogleBaseSuggestURLParameter[] = "google:baseSuggestURL"; 64 const char kGoogleBaseSuggestURLParameterFull[] = "{google:baseSuggestURL}"; 65 const char kGoogleBookmarkBarPinnedParameter[] = "google:bookmarkBarPinned"; 66 const char kGoogleContextualSearchContextData[] = 67 "google:contextualSearchContextData"; 68 const char kGoogleContextualSearchVersion[] = "google:contextualSearchVersion"; 69 const char kGoogleCurrentPageUrlParameter[] = "google:currentPageUrl"; 70 const char kGoogleCursorPositionParameter[] = "google:cursorPosition"; 71 const char kGoogleForceInstantResultsParameter[] = "google:forceInstantResults"; 72 const char kGoogleImageSearchSource[] = "google:imageSearchSource"; 73 const char kGoogleImageThumbnailParameter[] = "google:imageThumbnail"; 74 const char kGoogleImageOriginalWidth[] = "google:imageOriginalWidth"; 75 const char kGoogleImageOriginalHeight[] = "google:imageOriginalHeight"; 76 const char kGoogleImageURLParameter[] = "google:imageURL"; 77 const char kGoogleInputTypeParameter[] = "google:inputType"; 78 const char kGoogleInstantExtendedEnabledParameter[] = 79 "google:instantExtendedEnabledParameter"; 80 const char kGoogleInstantExtendedEnabledKey[] = 81 "google:instantExtendedEnabledKey"; 82 const char kGoogleInstantExtendedEnabledKeyFull[] = 83 "{google:instantExtendedEnabledKey}"; 84 const char kGoogleNTPIsThemedParameter[] = "google:ntpIsThemedParameter"; 85 const char kGoogleOmniboxStartMarginParameter[] = 86 "google:omniboxStartMarginParameter"; 87 const char kGoogleOriginalQueryForSuggestionParameter[] = 88 "google:originalQueryForSuggestion"; 89 const char kGooglePageClassificationParameter[] = "google:pageClassification"; 90 const char kGoogleRLZParameter[] = "google:RLZ"; 91 const char kGoogleSearchClient[] = "google:searchClient"; 92 const char kGoogleSearchFieldtrialParameter[] = 93 "google:searchFieldtrialParameter"; 94 const char kGoogleSearchVersion[] = "google:searchVersion"; 95 const char kGoogleSessionToken[] = "google:sessionToken"; 96 const char kGoogleSourceIdParameter[] = "google:sourceId"; 97 const char kGoogleSuggestAPIKeyParameter[] = "google:suggestAPIKeyParameter"; 98 const char kGoogleSuggestClient[] = "google:suggestClient"; 99 const char kGoogleSuggestRequestId[] = "google:suggestRid"; 100 101 // Same as kSearchTermsParameter, with no escaping. 102 const char kGoogleUnescapedSearchTermsParameter[] = 103 "google:unescapedSearchTerms"; 104 const char kGoogleUnescapedSearchTermsParameterFull[] = 105 "{google:unescapedSearchTerms}"; 106 107 // Display value for kSearchTermsParameter. 108 const char kDisplaySearchTerms[] = "%s"; 109 110 // Display value for kGoogleUnescapedSearchTermsParameter. 111 const char kDisplayUnescapedSearchTerms[] = "%S"; 112 113 // Used if the count parameter is not optional. Indicates we want 10 search 114 // results. 115 const char kDefaultCount[] = "10"; 116 117 // Used if the parameter kOutputEncodingParameter is required. 118 const char kOutputEncodingType[] = "UTF-8"; 119 120 // Attempts to encode |terms| and |original_query| in |encoding| and escape 121 // them. |terms| may be escaped as path or query depending on |is_in_query|; 122 // |original_query| is always escaped as query. Returns whether the encoding 123 // process succeeded. 124 bool TryEncoding(const base::string16& terms, 125 const base::string16& original_query, 126 const char* encoding, 127 bool is_in_query, 128 base::string16* escaped_terms, 129 base::string16* escaped_original_query) { 130 DCHECK(escaped_terms); 131 DCHECK(escaped_original_query); 132 std::string encoded_terms; 133 if (!base::UTF16ToCodepage(terms, encoding, 134 base::OnStringConversionError::SKIP, &encoded_terms)) 135 return false; 136 *escaped_terms = base::UTF8ToUTF16(is_in_query ? 137 net::EscapeQueryParamValue(encoded_terms, true) : 138 net::EscapePath(encoded_terms)); 139 if (original_query.empty()) 140 return true; 141 std::string encoded_original_query; 142 if (!base::UTF16ToCodepage(original_query, encoding, 143 base::OnStringConversionError::SKIP, &encoded_original_query)) 144 return false; 145 *escaped_original_query = base::UTF8ToUTF16( 146 net::EscapeQueryParamValue(encoded_original_query, true)); 147 return true; 148 } 149 150 // Extract query key and host given a list of parameters coming from the URL 151 // query or ref. 152 std::string FindSearchTermsKey(const std::string& params) { 153 if (params.empty()) 154 return std::string(); 155 url::Component query, key, value; 156 query.len = static_cast<int>(params.size()); 157 while (url::ExtractQueryKeyValue(params.c_str(), &query, &key, &value)) { 158 if (key.is_nonempty() && value.is_nonempty()) { 159 std::string value_string = params.substr(value.begin, value.len); 160 if (value_string.find(kSearchTermsParameterFull, 0) != 161 std::string::npos || 162 value_string.find(kGoogleUnescapedSearchTermsParameterFull, 0) != 163 std::string::npos) { 164 return params.substr(key.begin, key.len); 165 } 166 } 167 } 168 return std::string(); 169 } 170 171 bool IsTemplateParameterString(const std::string& param) { 172 return (param.length() > 2) && (*(param.begin()) == kStartParameter) && 173 (*(param.rbegin()) == kEndParameter); 174 } 175 176 bool ShowingSearchTermsOnSRP() { 177 return chrome::IsInstantExtendedAPIEnabled() && 178 chrome::IsQueryExtractionEnabled(); 179 } 180 181 } // namespace 182 183 184 // TemplateURLRef::SearchTermsArgs -------------------------------------------- 185 186 TemplateURLRef::SearchTermsArgs::SearchTermsArgs( 187 const base::string16& search_terms) 188 : search_terms(search_terms), 189 input_type(metrics::OmniboxInputType::INVALID), 190 accepted_suggestion(NO_SUGGESTIONS_AVAILABLE), 191 cursor_position(base::string16::npos), 192 omnibox_start_margin(-1), 193 page_classification(metrics::OmniboxEventProto::INVALID_SPEC), 194 bookmark_bar_pinned(false), 195 append_extra_query_params(false), 196 force_instant_results(false), 197 from_app_list(false), 198 contextual_search_params(ContextualSearchParams()) { 199 } 200 201 TemplateURLRef::SearchTermsArgs::~SearchTermsArgs() { 202 } 203 204 TemplateURLRef::SearchTermsArgs::ContextualSearchParams:: 205 ContextualSearchParams() 206 : version(-1), 207 start(base::string16::npos), 208 end(base::string16::npos) { 209 } 210 211 TemplateURLRef::SearchTermsArgs::ContextualSearchParams:: 212 ContextualSearchParams( 213 const int version, 214 const size_t start, 215 const size_t end, 216 const std::string& selection, 217 const std::string& content, 218 const std::string& base_page_url, 219 const std::string& encoding) 220 : version(version), 221 start(start), 222 end(end), 223 selection(selection), 224 content(content), 225 base_page_url(base_page_url), 226 encoding(encoding) { 227 } 228 229 TemplateURLRef::SearchTermsArgs::ContextualSearchParams:: 230 ~ContextualSearchParams() { 231 } 232 233 // TemplateURLRef ------------------------------------------------------------- 234 235 TemplateURLRef::TemplateURLRef(TemplateURL* owner, Type type) 236 : owner_(owner), 237 type_(type), 238 index_in_owner_(-1), 239 parsed_(false), 240 valid_(false), 241 supports_replacements_(false), 242 search_term_key_location_(url::Parsed::QUERY), 243 prepopulated_(false), 244 showing_search_terms_(ShowingSearchTermsOnSRP()) { 245 DCHECK(owner_); 246 DCHECK_NE(INDEXED, type_); 247 } 248 249 TemplateURLRef::TemplateURLRef(TemplateURL* owner, size_t index_in_owner) 250 : owner_(owner), 251 type_(INDEXED), 252 index_in_owner_(index_in_owner), 253 parsed_(false), 254 valid_(false), 255 supports_replacements_(false), 256 search_term_key_location_(url::Parsed::QUERY), 257 prepopulated_(false), 258 showing_search_terms_(ShowingSearchTermsOnSRP()) { 259 DCHECK(owner_); 260 DCHECK_LT(index_in_owner_, owner_->URLCount()); 261 } 262 263 TemplateURLRef::~TemplateURLRef() { 264 } 265 266 std::string TemplateURLRef::GetURL() const { 267 switch (type_) { 268 case SEARCH: return owner_->url(); 269 case SUGGEST: return owner_->suggestions_url(); 270 case INSTANT: return owner_->instant_url(); 271 case IMAGE: return owner_->image_url(); 272 case NEW_TAB: return owner_->new_tab_url(); 273 case CONTEXTUAL_SEARCH: return owner_->contextual_search_url(); 274 case INDEXED: return owner_->GetURL(index_in_owner_); 275 default: NOTREACHED(); return std::string(); // NOLINT 276 } 277 } 278 279 std::string TemplateURLRef::GetPostParamsString() const { 280 switch (type_) { 281 case INDEXED: 282 case SEARCH: return owner_->search_url_post_params(); 283 case SUGGEST: return owner_->suggestions_url_post_params(); 284 case INSTANT: return owner_->instant_url_post_params(); 285 case NEW_TAB: return std::string(); 286 case CONTEXTUAL_SEARCH: return std::string(); 287 case IMAGE: return owner_->image_url_post_params(); 288 default: NOTREACHED(); return std::string(); // NOLINT 289 } 290 } 291 292 bool TemplateURLRef::UsesPOSTMethod( 293 const SearchTermsData& search_terms_data) const { 294 ParseIfNecessary(search_terms_data); 295 return !post_params_.empty(); 296 } 297 298 bool TemplateURLRef::EncodeFormData(const PostParams& post_params, 299 PostContent* post_content) const { 300 if (post_params.empty()) 301 return true; 302 if (!post_content) 303 return false; 304 305 const char kUploadDataMIMEType[] = "multipart/form-data; boundary="; 306 const char kMultipartBoundary[] = "----+*+----%016" PRIx64 "----+*+----"; 307 // Each name/value pair is stored in a body part which is preceded by a 308 // boundary delimiter line. Uses random number generator here to create 309 // a unique boundary delimiter for form data encoding. 310 std::string boundary = base::StringPrintf(kMultipartBoundary, 311 base::RandUint64()); 312 // Sets the content MIME type. 313 post_content->first = kUploadDataMIMEType; 314 post_content->first += boundary; 315 // Encodes the post parameters. 316 std::string* post_data = &post_content->second; 317 post_data->clear(); 318 for (PostParams::const_iterator param = post_params.begin(); 319 param != post_params.end(); ++param) { 320 DCHECK(!param->first.empty()); 321 net::AddMultipartValueForUpload(param->first, param->second, boundary, 322 std::string(), post_data); 323 } 324 net::AddMultipartFinalDelimiterForUpload(boundary, post_data); 325 return true; 326 } 327 328 bool TemplateURLRef::SupportsReplacement( 329 const SearchTermsData& search_terms_data) const { 330 ParseIfNecessary(search_terms_data); 331 return valid_ && supports_replacements_; 332 } 333 334 std::string TemplateURLRef::ReplaceSearchTerms( 335 const SearchTermsArgs& search_terms_args, 336 const SearchTermsData& search_terms_data, 337 PostContent* post_content) const { 338 ParseIfNecessary(search_terms_data); 339 if (!valid_) 340 return std::string(); 341 342 std::string url(HandleReplacements(search_terms_args, search_terms_data, 343 post_content)); 344 345 GURL gurl(url); 346 if (!gurl.is_valid()) 347 return url; 348 349 std::vector<std::string> query_params; 350 if (search_terms_args.append_extra_query_params) { 351 std::string extra_params( 352 CommandLine::ForCurrentProcess()->GetSwitchValueASCII( 353 switches::kExtraSearchQueryParams)); 354 if (!extra_params.empty()) 355 query_params.push_back(extra_params); 356 } 357 if (!search_terms_args.suggest_query_params.empty()) 358 query_params.push_back(search_terms_args.suggest_query_params); 359 if (!gurl.query().empty()) 360 query_params.push_back(gurl.query()); 361 362 if (query_params.empty()) 363 return url; 364 365 GURL::Replacements replacements; 366 std::string query_str = JoinString(query_params, "&"); 367 replacements.SetQueryStr(query_str); 368 return gurl.ReplaceComponents(replacements).possibly_invalid_spec(); 369 } 370 371 bool TemplateURLRef::IsValid(const SearchTermsData& search_terms_data) const { 372 ParseIfNecessary(search_terms_data); 373 return valid_; 374 } 375 376 base::string16 TemplateURLRef::DisplayURL( 377 const SearchTermsData& search_terms_data) const { 378 ParseIfNecessary(search_terms_data); 379 base::string16 result(base::UTF8ToUTF16(GetURL())); 380 if (valid_ && !replacements_.empty()) { 381 ReplaceSubstringsAfterOffset(&result, 0, 382 base::ASCIIToUTF16(kSearchTermsParameterFull), 383 base::ASCIIToUTF16(kDisplaySearchTerms)); 384 ReplaceSubstringsAfterOffset(&result, 0, 385 base::ASCIIToUTF16(kGoogleUnescapedSearchTermsParameterFull), 386 base::ASCIIToUTF16(kDisplayUnescapedSearchTerms)); 387 } 388 return result; 389 } 390 391 // static 392 std::string TemplateURLRef::DisplayURLToURLRef( 393 const base::string16& display_url) { 394 base::string16 result = display_url; 395 ReplaceSubstringsAfterOffset(&result, 0, 396 base::ASCIIToUTF16(kDisplaySearchTerms), 397 base::ASCIIToUTF16(kSearchTermsParameterFull)); 398 ReplaceSubstringsAfterOffset( 399 &result, 0, 400 base::ASCIIToUTF16(kDisplayUnescapedSearchTerms), 401 base::ASCIIToUTF16(kGoogleUnescapedSearchTermsParameterFull)); 402 return base::UTF16ToUTF8(result); 403 } 404 405 const std::string& TemplateURLRef::GetHost( 406 const SearchTermsData& search_terms_data) const { 407 ParseIfNecessary(search_terms_data); 408 return host_; 409 } 410 411 const std::string& TemplateURLRef::GetPath( 412 const SearchTermsData& search_terms_data) const { 413 ParseIfNecessary(search_terms_data); 414 return path_; 415 } 416 417 const std::string& TemplateURLRef::GetSearchTermKey( 418 const SearchTermsData& search_terms_data) const { 419 ParseIfNecessary(search_terms_data); 420 return search_term_key_; 421 } 422 423 base::string16 TemplateURLRef::SearchTermToString16( 424 const std::string& term) const { 425 const std::vector<std::string>& encodings = owner_->input_encodings(); 426 base::string16 result; 427 428 std::string unescaped = net::UnescapeURLComponent( 429 term, 430 net::UnescapeRule::REPLACE_PLUS_WITH_SPACE | 431 net::UnescapeRule::URL_SPECIAL_CHARS); 432 for (size_t i = 0; i < encodings.size(); ++i) { 433 if (base::CodepageToUTF16(unescaped, encodings[i].c_str(), 434 base::OnStringConversionError::FAIL, &result)) 435 return result; 436 } 437 438 // Always fall back on UTF-8 if it works. 439 if (base::CodepageToUTF16(unescaped, base::kCodepageUTF8, 440 base::OnStringConversionError::FAIL, &result)) 441 return result; 442 443 // When nothing worked, just use the escaped text. We have no idea what the 444 // encoding is. We need to substitute spaces for pluses ourselves since we're 445 // not sending it through an unescaper. 446 result = base::UTF8ToUTF16(term); 447 std::replace(result.begin(), result.end(), '+', ' '); 448 return result; 449 } 450 451 bool TemplateURLRef::HasGoogleBaseURLs( 452 const SearchTermsData& search_terms_data) const { 453 ParseIfNecessary(search_terms_data); 454 for (size_t i = 0; i < replacements_.size(); ++i) { 455 if ((replacements_[i].type == GOOGLE_BASE_URL) || 456 (replacements_[i].type == GOOGLE_BASE_SUGGEST_URL)) 457 return true; 458 } 459 return false; 460 } 461 462 bool TemplateURLRef::ExtractSearchTermsFromURL( 463 const GURL& url, 464 base::string16* search_terms, 465 const SearchTermsData& search_terms_data, 466 url::Parsed::ComponentType* search_terms_component, 467 url::Component* search_terms_position) const { 468 DCHECK(search_terms); 469 search_terms->clear(); 470 471 ParseIfNecessary(search_terms_data); 472 473 // We need a search term in the template URL to extract something. 474 if (search_term_key_.empty()) 475 return false; 476 477 // TODO(beaudoin): Support patterns of the form http://foo/{searchTerms}/ 478 // See crbug.com/153798 479 480 // Fill-in the replacements. We don't care about search terms in the pattern, 481 // so we use the empty string. 482 // Currently we assume the search term only shows in URL, not in post params. 483 GURL pattern(ReplaceSearchTerms(SearchTermsArgs(base::string16()), 484 search_terms_data, NULL)); 485 // Host, path and port must match. 486 if (url.port() != pattern.port() || 487 url.host() != host_ || 488 url.path() != path_) { 489 return false; 490 } 491 492 // Parameter must be present either in the query or the ref. 493 const std::string& params( 494 (search_term_key_location_ == url::Parsed::QUERY) ? 495 url.query() : url.ref()); 496 497 url::Component query, key, value; 498 query.len = static_cast<int>(params.size()); 499 bool key_found = false; 500 while (url::ExtractQueryKeyValue(params.c_str(), &query, &key, &value)) { 501 if (key.is_nonempty()) { 502 if (params.substr(key.begin, key.len) == search_term_key_) { 503 // Fail if search term key is found twice. 504 if (key_found) { 505 search_terms->clear(); 506 return false; 507 } 508 key_found = true; 509 // Extract the search term. 510 *search_terms = net::UnescapeAndDecodeUTF8URLComponent( 511 params.substr(value.begin, value.len), 512 net::UnescapeRule::SPACES | 513 net::UnescapeRule::URL_SPECIAL_CHARS | 514 net::UnescapeRule::REPLACE_PLUS_WITH_SPACE); 515 if (search_terms_component) 516 *search_terms_component = search_term_key_location_; 517 if (search_terms_position) 518 *search_terms_position = value; 519 } 520 } 521 } 522 return key_found; 523 } 524 525 void TemplateURLRef::InvalidateCachedValues() const { 526 supports_replacements_ = valid_ = parsed_ = false; 527 host_.clear(); 528 path_.clear(); 529 search_term_key_.clear(); 530 replacements_.clear(); 531 post_params_.clear(); 532 } 533 534 bool TemplateURLRef::ParseParameter(size_t start, 535 size_t end, 536 std::string* url, 537 Replacements* replacements) const { 538 DCHECK(start != std::string::npos && 539 end != std::string::npos && end > start); 540 size_t length = end - start - 1; 541 bool optional = false; 542 if ((*url)[end - 1] == kOptional) { 543 optional = true; 544 length--; 545 } 546 std::string parameter(url->substr(start + 1, length)); 547 std::string full_parameter(url->substr(start, end - start + 1)); 548 // Remove the parameter from the string. For parameters who replacement is 549 // constant and already known, just replace them directly. For other cases, 550 // like parameters whose values may change over time, use |replacements|. 551 url->erase(start, end - start + 1); 552 if (parameter == kSearchTermsParameter) { 553 replacements->push_back(Replacement(SEARCH_TERMS, start)); 554 } else if (parameter == kCountParameter) { 555 if (!optional) 556 url->insert(start, kDefaultCount); 557 } else if (parameter == kGoogleAssistedQueryStatsParameter) { 558 replacements->push_back(Replacement(GOOGLE_ASSISTED_QUERY_STATS, start)); 559 } else if (parameter == kGoogleBaseURLParameter) { 560 replacements->push_back(Replacement(GOOGLE_BASE_URL, start)); 561 } else if (parameter == kGoogleBaseSuggestURLParameter) { 562 replacements->push_back(Replacement(GOOGLE_BASE_SUGGEST_URL, start)); 563 } else if (parameter == kGoogleBookmarkBarPinnedParameter) { 564 replacements->push_back(Replacement(GOOGLE_BOOKMARK_BAR_PINNED, start)); 565 } else if (parameter == kGoogleCurrentPageUrlParameter) { 566 replacements->push_back(Replacement(GOOGLE_CURRENT_PAGE_URL, start)); 567 } else if (parameter == kGoogleCursorPositionParameter) { 568 replacements->push_back(Replacement(GOOGLE_CURSOR_POSITION, start)); 569 } else if (parameter == kGoogleForceInstantResultsParameter) { 570 replacements->push_back(Replacement(GOOGLE_FORCE_INSTANT_RESULTS, start)); 571 } else if (parameter == kGoogleImageOriginalHeight) { 572 replacements->push_back( 573 Replacement(TemplateURLRef::GOOGLE_IMAGE_ORIGINAL_HEIGHT, start)); 574 } else if (parameter == kGoogleImageOriginalWidth) { 575 replacements->push_back( 576 Replacement(TemplateURLRef::GOOGLE_IMAGE_ORIGINAL_WIDTH, start)); 577 } else if (parameter == kGoogleImageSearchSource) { 578 replacements->push_back( 579 Replacement(TemplateURLRef::GOOGLE_IMAGE_SEARCH_SOURCE, start)); 580 } else if (parameter == kGoogleImageThumbnailParameter) { 581 replacements->push_back( 582 Replacement(TemplateURLRef::GOOGLE_IMAGE_THUMBNAIL, start)); 583 } else if (parameter == kGoogleImageURLParameter) { 584 replacements->push_back(Replacement(TemplateURLRef::GOOGLE_IMAGE_URL, 585 start)); 586 } else if (parameter == kGoogleInputTypeParameter) { 587 replacements->push_back(Replacement(TemplateURLRef::GOOGLE_INPUT_TYPE, 588 start)); 589 } else if (parameter == kGoogleInstantExtendedEnabledParameter) { 590 replacements->push_back(Replacement(GOOGLE_INSTANT_EXTENDED_ENABLED, 591 start)); 592 } else if (parameter == kGoogleInstantExtendedEnabledKey) { 593 url->insert(start, google_util::kInstantExtendedAPIParam); 594 } else if (parameter == kGoogleNTPIsThemedParameter) { 595 replacements->push_back(Replacement(GOOGLE_NTP_IS_THEMED, start)); 596 } else if (parameter == kGoogleOmniboxStartMarginParameter) { 597 replacements->push_back(Replacement(GOOGLE_OMNIBOX_START_MARGIN, start)); 598 } else if (parameter == kGoogleContextualSearchVersion) { 599 replacements->push_back( 600 Replacement(GOOGLE_CONTEXTUAL_SEARCH_VERSION, start)); 601 } else if (parameter == kGoogleContextualSearchContextData) { 602 replacements->push_back( 603 Replacement(GOOGLE_CONTEXTUAL_SEARCH_CONTEXT_DATA, start)); 604 } else if (parameter == kGoogleOriginalQueryForSuggestionParameter) { 605 replacements->push_back(Replacement(GOOGLE_ORIGINAL_QUERY_FOR_SUGGESTION, 606 start)); 607 } else if (parameter == kGooglePageClassificationParameter) { 608 replacements->push_back(Replacement(GOOGLE_PAGE_CLASSIFICATION, start)); 609 } else if (parameter == kGoogleRLZParameter) { 610 replacements->push_back(Replacement(GOOGLE_RLZ, start)); 611 } else if (parameter == kGoogleSearchClient) { 612 replacements->push_back(Replacement(GOOGLE_SEARCH_CLIENT, start)); 613 } else if (parameter == kGoogleSearchFieldtrialParameter) { 614 replacements->push_back(Replacement(GOOGLE_SEARCH_FIELDTRIAL_GROUP, start)); 615 } else if (parameter == kGoogleSearchVersion) { 616 if (OmniboxFieldTrial::EnableAnswersInSuggest()) 617 url->insert(start, "gs_rn=42&"); 618 } else if (parameter == kGoogleSessionToken) { 619 replacements->push_back(Replacement(GOOGLE_SESSION_TOKEN, start)); 620 } else if (parameter == kGoogleSourceIdParameter) { 621 #if defined(OS_ANDROID) 622 url->insert(start, "sourceid=chrome-mobile&"); 623 #else 624 url->insert(start, "sourceid=chrome&"); 625 #endif 626 } else if (parameter == kGoogleSuggestAPIKeyParameter) { 627 url->insert(start, 628 net::EscapeQueryParamValue(google_apis::GetAPIKey(), false)); 629 } else if (parameter == kGoogleSuggestClient) { 630 replacements->push_back(Replacement(GOOGLE_SUGGEST_CLIENT, start)); 631 } else if (parameter == kGoogleSuggestRequestId) { 632 replacements->push_back(Replacement(GOOGLE_SUGGEST_REQUEST_ID, start)); 633 } else if (parameter == kGoogleUnescapedSearchTermsParameter) { 634 replacements->push_back(Replacement(GOOGLE_UNESCAPED_SEARCH_TERMS, start)); 635 } else if (parameter == kInputEncodingParameter) { 636 replacements->push_back(Replacement(ENCODING, start)); 637 } else if (parameter == kLanguageParameter) { 638 replacements->push_back(Replacement(LANGUAGE, start)); 639 } else if (parameter == kOutputEncodingParameter) { 640 if (!optional) 641 url->insert(start, kOutputEncodingType); 642 } else if ((parameter == kStartIndexParameter) || 643 (parameter == kStartPageParameter)) { 644 // We don't support these. 645 if (!optional) 646 url->insert(start, "1"); 647 } else if (!prepopulated_) { 648 // If it's a prepopulated URL, we know that it's safe to remove unknown 649 // parameters, so just ignore this and return true below. Otherwise it could 650 // be some garbage but can also be a javascript block. Put it back. 651 url->insert(start, full_parameter); 652 return false; 653 } 654 return true; 655 } 656 657 std::string TemplateURLRef::ParseURL(const std::string& url, 658 Replacements* replacements, 659 PostParams* post_params, 660 bool* valid) const { 661 *valid = false; 662 std::string parsed_url = url; 663 for (size_t last = 0; last != std::string::npos; ) { 664 last = parsed_url.find(kStartParameter, last); 665 if (last != std::string::npos) { 666 size_t template_end = parsed_url.find(kEndParameter, last); 667 if (template_end != std::string::npos) { 668 // Since we allow Javascript in the URL, {} pairs could be nested. Match 669 // only leaf pairs with supported parameters. 670 size_t next_template_start = parsed_url.find(kStartParameter, last + 1); 671 if (next_template_start == std::string::npos || 672 next_template_start > template_end) { 673 // If successful, ParseParameter erases from the string as such no 674 // need to update |last|. If failed, move |last| to the end of pair. 675 if (!ParseParameter(last, template_end, &parsed_url, replacements)) { 676 // |template_end| + 1 may be beyond the end of the string. 677 last = template_end; 678 } 679 } else { 680 last = next_template_start; 681 } 682 } else { 683 // Open brace without a closing brace, return. 684 return std::string(); 685 } 686 } 687 } 688 689 // Handles the post parameters. 690 const std::string& post_params_string = GetPostParamsString(); 691 if (!post_params_string.empty()) { 692 typedef std::vector<std::string> Strings; 693 Strings param_list; 694 base::SplitString(post_params_string, ',', ¶m_list); 695 696 for (Strings::const_iterator iterator = param_list.begin(); 697 iterator != param_list.end(); ++iterator) { 698 Strings parts; 699 // The '=' delimiter is required and the name must be not empty. 700 base::SplitString(*iterator, '=', &parts); 701 if ((parts.size() != 2U) || parts[0].empty()) 702 return std::string(); 703 704 std::string& value = parts[1]; 705 size_t replacements_size = replacements->size(); 706 if (IsTemplateParameterString(value)) 707 ParseParameter(0, value.length() - 1, &value, replacements); 708 post_params->push_back(std::make_pair(parts[0], value)); 709 // If there was a replacement added, points its index to last added 710 // PostParam. 711 if (replacements->size() > replacements_size) { 712 DCHECK_EQ(replacements_size + 1, replacements->size()); 713 Replacement* r = &replacements->back(); 714 r->is_post_param = true; 715 r->index = post_params->size() - 1; 716 } 717 } 718 DCHECK(!post_params->empty()); 719 } 720 721 *valid = true; 722 return parsed_url; 723 } 724 725 void TemplateURLRef::ParseIfNecessary( 726 const SearchTermsData& search_terms_data) const { 727 if (!parsed_) { 728 InvalidateCachedValues(); 729 parsed_ = true; 730 parsed_url_ = ParseURL(GetURL(), &replacements_, &post_params_, &valid_); 731 supports_replacements_ = false; 732 if (valid_) { 733 bool has_only_one_search_term = false; 734 for (Replacements::const_iterator i = replacements_.begin(); 735 i != replacements_.end(); ++i) { 736 if ((i->type == SEARCH_TERMS) || 737 (i->type == GOOGLE_UNESCAPED_SEARCH_TERMS)) { 738 if (has_only_one_search_term) { 739 has_only_one_search_term = false; 740 break; 741 } 742 has_only_one_search_term = true; 743 supports_replacements_ = true; 744 } 745 } 746 // Only parse the host/key if there is one search term. Technically there 747 // could be more than one term, but it's uncommon; so we punt. 748 if (has_only_one_search_term) 749 ParseHostAndSearchTermKey(search_terms_data); 750 } 751 } 752 } 753 754 void TemplateURLRef::ParseHostAndSearchTermKey( 755 const SearchTermsData& search_terms_data) const { 756 std::string url_string(GetURL()); 757 ReplaceSubstringsAfterOffset(&url_string, 0, 758 kGoogleBaseURLParameterFull, 759 search_terms_data.GoogleBaseURLValue()); 760 ReplaceSubstringsAfterOffset(&url_string, 0, 761 kGoogleBaseSuggestURLParameterFull, 762 search_terms_data.GoogleBaseSuggestURLValue()); 763 764 search_term_key_.clear(); 765 host_.clear(); 766 path_.clear(); 767 search_term_key_location_ = url::Parsed::REF; 768 769 GURL url(url_string); 770 if (!url.is_valid()) 771 return; 772 773 std::string query_key = FindSearchTermsKey(url.query()); 774 std::string ref_key = FindSearchTermsKey(url.ref()); 775 if (query_key.empty() == ref_key.empty()) 776 return; // No key or multiple keys found. We only handle having one key. 777 search_term_key_ = query_key.empty() ? ref_key : query_key; 778 search_term_key_location_ = 779 query_key.empty() ? url::Parsed::REF : url::Parsed::QUERY; 780 host_ = url.host(); 781 path_ = url.path(); 782 } 783 784 void TemplateURLRef::HandleReplacement(const std::string& name, 785 const std::string& value, 786 const Replacement& replacement, 787 std::string* url) const { 788 size_t pos = replacement.index; 789 if (replacement.is_post_param) { 790 DCHECK_LT(pos, post_params_.size()); 791 DCHECK(!post_params_[pos].first.empty()); 792 post_params_[pos].second = value; 793 } else { 794 url->insert(pos, name.empty() ? value : (name + "=" + value + "&")); 795 } 796 } 797 798 std::string TemplateURLRef::HandleReplacements( 799 const SearchTermsArgs& search_terms_args, 800 const SearchTermsData& search_terms_data, 801 PostContent* post_content) const { 802 if (replacements_.empty()) { 803 if (!post_params_.empty()) 804 EncodeFormData(post_params_, post_content); 805 return parsed_url_; 806 } 807 808 // Determine if the search terms are in the query or before. We're escaping 809 // space as '+' in the former case and as '%20' in the latter case. 810 bool is_in_query = true; 811 for (Replacements::iterator i = replacements_.begin(); 812 i != replacements_.end(); ++i) { 813 if (i->type == SEARCH_TERMS) { 814 base::string16::size_type query_start = parsed_url_.find('?'); 815 is_in_query = query_start != base::string16::npos && 816 (static_cast<base::string16::size_type>(i->index) > query_start); 817 break; 818 } 819 } 820 821 std::string input_encoding; 822 base::string16 encoded_terms; 823 base::string16 encoded_original_query; 824 owner_->EncodeSearchTerms(search_terms_args, is_in_query, &input_encoding, 825 &encoded_terms, &encoded_original_query); 826 827 std::string url = parsed_url_; 828 829 // replacements_ is ordered in ascending order, as such we need to iterate 830 // from the back. 831 for (Replacements::reverse_iterator i = replacements_.rbegin(); 832 i != replacements_.rend(); ++i) { 833 switch (i->type) { 834 case ENCODING: 835 HandleReplacement(std::string(), input_encoding, *i, &url); 836 break; 837 838 case GOOGLE_ASSISTED_QUERY_STATS: 839 DCHECK(!i->is_post_param); 840 if (!search_terms_args.assisted_query_stats.empty()) { 841 // Get the base URL without substituting AQS to avoid infinite 842 // recursion. We need the URL to find out if it meets all 843 // AQS requirements (e.g. HTTPS protocol check). 844 // See TemplateURLRef::SearchTermsArgs for more details. 845 SearchTermsArgs search_terms_args_without_aqs(search_terms_args); 846 search_terms_args_without_aqs.assisted_query_stats.clear(); 847 GURL base_url(ReplaceSearchTerms( 848 search_terms_args_without_aqs, search_terms_data, NULL)); 849 if (base_url.SchemeIs(url::kHttpsScheme)) { 850 HandleReplacement( 851 "aqs", search_terms_args.assisted_query_stats, *i, &url); 852 } 853 } 854 break; 855 856 case GOOGLE_BASE_URL: 857 DCHECK(!i->is_post_param); 858 HandleReplacement( 859 std::string(), search_terms_data.GoogleBaseURLValue(), *i, &url); 860 break; 861 862 case GOOGLE_BASE_SUGGEST_URL: 863 DCHECK(!i->is_post_param); 864 HandleReplacement( 865 std::string(), search_terms_data.GoogleBaseSuggestURLValue(), *i, 866 &url); 867 break; 868 869 case GOOGLE_BOOKMARK_BAR_PINNED: 870 if (showing_search_terms_) { 871 // Log whether the bookmark bar is pinned when the user is seeing 872 // InstantExtended on the SRP. 873 DCHECK(!i->is_post_param); 874 HandleReplacement( 875 "bmbp", search_terms_args.bookmark_bar_pinned ? "1" : "0", *i, 876 &url); 877 } 878 break; 879 880 case GOOGLE_CURRENT_PAGE_URL: 881 DCHECK(!i->is_post_param); 882 if (!search_terms_args.current_page_url.empty()) { 883 const std::string& escaped_current_page_url = 884 net::EscapeQueryParamValue(search_terms_args.current_page_url, 885 true); 886 HandleReplacement("url", escaped_current_page_url, *i, &url); 887 } 888 break; 889 890 case GOOGLE_CURSOR_POSITION: 891 DCHECK(!i->is_post_param); 892 if (search_terms_args.cursor_position != base::string16::npos) 893 HandleReplacement( 894 "cp", 895 base::StringPrintf("%" PRIuS, search_terms_args.cursor_position), 896 *i, 897 &url); 898 break; 899 900 case GOOGLE_FORCE_INSTANT_RESULTS: 901 DCHECK(!i->is_post_param); 902 HandleReplacement(std::string(), 903 chrome::ForceInstantResultsParam( 904 search_terms_args.force_instant_results), 905 *i, 906 &url); 907 break; 908 909 case GOOGLE_INPUT_TYPE: 910 DCHECK(!i->is_post_param); 911 HandleReplacement( 912 "oit", base::IntToString(search_terms_args.input_type), *i, &url); 913 break; 914 915 case GOOGLE_INSTANT_EXTENDED_ENABLED: 916 DCHECK(!i->is_post_param); 917 HandleReplacement(std::string(), 918 chrome::InstantExtendedEnabledParam(type_ == SEARCH), 919 *i, 920 &url); 921 break; 922 923 case GOOGLE_NTP_IS_THEMED: 924 DCHECK(!i->is_post_param); 925 HandleReplacement( 926 std::string(), search_terms_data.NTPIsThemedParam(), *i, &url); 927 break; 928 929 case GOOGLE_OMNIBOX_START_MARGIN: 930 DCHECK(!i->is_post_param); 931 if (search_terms_args.omnibox_start_margin >= 0) { 932 HandleReplacement( 933 "es_sm", 934 base::IntToString(search_terms_args.omnibox_start_margin), 935 *i, 936 &url); 937 } 938 break; 939 940 case GOOGLE_CONTEXTUAL_SEARCH_VERSION: 941 if (search_terms_args.contextual_search_params.version >= 0) { 942 HandleReplacement( 943 "ctxs", 944 base::IntToString( 945 search_terms_args.contextual_search_params.version), 946 *i, 947 &url); 948 } 949 break; 950 951 case GOOGLE_CONTEXTUAL_SEARCH_CONTEXT_DATA: { 952 DCHECK(!i->is_post_param); 953 std::string context_data; 954 955 const SearchTermsArgs::ContextualSearchParams& params = 956 search_terms_args.contextual_search_params; 957 958 if (params.start != std::string::npos) { 959 context_data.append("ctxs_start=" + base::IntToString( 960 params.start) + "&"); 961 } 962 963 if (params.end != std::string::npos) { 964 context_data.append("ctxs_end=" + base::IntToString( 965 params.end) + "&"); 966 } 967 968 if (!params.selection.empty()) 969 context_data.append("q=" + params.selection + "&"); 970 971 if (!params.content.empty()) 972 context_data.append("ctxs_content=" + params.content + "&"); 973 974 if (!params.base_page_url.empty()) 975 context_data.append("ctxs_url=" + params.base_page_url + "&"); 976 977 if (!params.encoding.empty()) { 978 context_data.append("ctxs_encoding=" + params.encoding + "&"); 979 } 980 981 HandleReplacement(std::string(), context_data, *i, &url); 982 break; 983 } 984 985 case GOOGLE_ORIGINAL_QUERY_FOR_SUGGESTION: 986 DCHECK(!i->is_post_param); 987 if (search_terms_args.accepted_suggestion >= 0 || 988 !search_terms_args.assisted_query_stats.empty()) { 989 HandleReplacement( 990 "oq", base::UTF16ToUTF8(encoded_original_query), *i, &url); 991 } 992 break; 993 994 case GOOGLE_PAGE_CLASSIFICATION: 995 if (search_terms_args.page_classification != 996 metrics::OmniboxEventProto::INVALID_SPEC) { 997 HandleReplacement( 998 "pgcl", base::IntToString(search_terms_args.page_classification), 999 *i, &url); 1000 } 1001 break; 1002 1003 case GOOGLE_RLZ: { 1004 DCHECK(!i->is_post_param); 1005 // On platforms that don't have RLZ, we still want this branch 1006 // to happen so that we replace the RLZ template with the 1007 // empty string. (If we don't handle this case, we hit a 1008 // NOTREACHED below.) 1009 base::string16 rlz_string = search_terms_data.GetRlzParameterValue( 1010 search_terms_args.from_app_list); 1011 if (!rlz_string.empty()) { 1012 HandleReplacement("rlz", base::UTF16ToUTF8(rlz_string), *i, &url); 1013 } 1014 break; 1015 } 1016 1017 case GOOGLE_SEARCH_CLIENT: { 1018 DCHECK(!i->is_post_param); 1019 std::string client = search_terms_data.GetSearchClient(); 1020 if (!client.empty()) 1021 HandleReplacement("client", client, *i, &url); 1022 break; 1023 } 1024 1025 case GOOGLE_SEARCH_FIELDTRIAL_GROUP: 1026 // We are not currently running any fieldtrials that modulate the search 1027 // url. If we do, then we'd have some conditional insert such as: 1028 // url.insert(i->index, used_www ? "gcx=w&" : "gcx=c&"); 1029 break; 1030 1031 case GOOGLE_SESSION_TOKEN: { 1032 std::string token = search_terms_args.session_token; 1033 if (!token.empty()) 1034 HandleReplacement("psi", token, *i, &url); 1035 break; 1036 } 1037 1038 case GOOGLE_SUGGEST_CLIENT: 1039 HandleReplacement( 1040 std::string(), search_terms_data.GetSuggestClient(), *i, &url); 1041 break; 1042 1043 case GOOGLE_SUGGEST_REQUEST_ID: 1044 HandleReplacement( 1045 std::string(), search_terms_data.GetSuggestRequestIdentifier(), *i, 1046 &url); 1047 break; 1048 1049 case GOOGLE_UNESCAPED_SEARCH_TERMS: { 1050 std::string unescaped_terms; 1051 base::UTF16ToCodepage(search_terms_args.search_terms, 1052 input_encoding.c_str(), 1053 base::OnStringConversionError::SKIP, 1054 &unescaped_terms); 1055 HandleReplacement(std::string(), unescaped_terms, *i, &url); 1056 break; 1057 } 1058 1059 case LANGUAGE: 1060 HandleReplacement( 1061 std::string(), search_terms_data.GetApplicationLocale(), *i, &url); 1062 break; 1063 1064 case SEARCH_TERMS: 1065 HandleReplacement( 1066 std::string(), base::UTF16ToUTF8(encoded_terms), *i, &url); 1067 break; 1068 1069 case GOOGLE_IMAGE_THUMBNAIL: 1070 HandleReplacement( 1071 std::string(), search_terms_args.image_thumbnail_content, *i, &url); 1072 break; 1073 1074 case GOOGLE_IMAGE_URL: 1075 if (search_terms_args.image_url.is_valid()) { 1076 HandleReplacement( 1077 std::string(), search_terms_args.image_url.spec(), *i, &url); 1078 } 1079 break; 1080 1081 case GOOGLE_IMAGE_ORIGINAL_WIDTH: 1082 if (!search_terms_args.image_original_size.IsEmpty()) { 1083 HandleReplacement( 1084 std::string(), 1085 base::IntToString(search_terms_args.image_original_size.width()), 1086 *i, &url); 1087 } 1088 break; 1089 1090 case GOOGLE_IMAGE_ORIGINAL_HEIGHT: 1091 if (!search_terms_args.image_original_size.IsEmpty()) { 1092 HandleReplacement( 1093 std::string(), 1094 base::IntToString(search_terms_args.image_original_size.height()), 1095 *i, &url); 1096 } 1097 break; 1098 1099 case GOOGLE_IMAGE_SEARCH_SOURCE: 1100 HandleReplacement( 1101 std::string(), search_terms_data.GoogleImageSearchSource(), *i, 1102 &url); 1103 break; 1104 1105 default: 1106 NOTREACHED(); 1107 break; 1108 } 1109 } 1110 1111 if (!post_params_.empty()) 1112 EncodeFormData(post_params_, post_content); 1113 1114 return url; 1115 } 1116 1117 1118 // TemplateURL ---------------------------------------------------------------- 1119 1120 TemplateURL::TemplateURL(const TemplateURLData& data) 1121 : data_(data), 1122 url_ref_(this, TemplateURLRef::SEARCH), 1123 suggestions_url_ref_(this, 1124 TemplateURLRef::SUGGEST), 1125 instant_url_ref_(this, 1126 TemplateURLRef::INSTANT), 1127 image_url_ref_(this, TemplateURLRef::IMAGE), 1128 new_tab_url_ref_(this, TemplateURLRef::NEW_TAB), 1129 contextual_search_url_ref_(this, TemplateURLRef::CONTEXTUAL_SEARCH) { 1130 SetPrepopulateId(data_.prepopulate_id); 1131 1132 if (data_.search_terms_replacement_key == 1133 kGoogleInstantExtendedEnabledKeyFull) { 1134 data_.search_terms_replacement_key = google_util::kInstantExtendedAPIParam; 1135 } 1136 } 1137 1138 TemplateURL::~TemplateURL() { 1139 } 1140 1141 // static 1142 base::string16 TemplateURL::GenerateKeyword(const GURL& url) { 1143 DCHECK(url.is_valid()); 1144 // Strip "www." off the front of the keyword; otherwise the keyword won't work 1145 // properly. See http://code.google.com/p/chromium/issues/detail?id=6984 . 1146 // Special case: if the host was exactly "www." (not sure this can happen but 1147 // perhaps with some weird intranet and custom DNS server?), ensure we at 1148 // least don't return the empty string. 1149 base::string16 keyword(net::StripWWWFromHost(url)); 1150 return keyword.empty() ? base::ASCIIToUTF16("www") : keyword; 1151 } 1152 1153 // static 1154 GURL TemplateURL::GenerateFaviconURL(const GURL& url) { 1155 DCHECK(url.is_valid()); 1156 GURL::Replacements rep; 1157 1158 const char favicon_path[] = "/favicon.ico"; 1159 int favicon_path_len = arraysize(favicon_path) - 1; 1160 1161 rep.SetPath(favicon_path, url::Component(0, favicon_path_len)); 1162 rep.ClearUsername(); 1163 rep.ClearPassword(); 1164 rep.ClearQuery(); 1165 rep.ClearRef(); 1166 return url.ReplaceComponents(rep); 1167 } 1168 1169 // static 1170 bool TemplateURL::MatchesData(const TemplateURL* t_url, 1171 const TemplateURLData* data, 1172 const SearchTermsData& search_terms_data) { 1173 if (!t_url || !data) 1174 return !t_url && !data; 1175 1176 return (t_url->short_name() == data->short_name) && 1177 t_url->HasSameKeywordAs(*data, search_terms_data) && 1178 (t_url->url() == data->url()) && 1179 (t_url->suggestions_url() == data->suggestions_url) && 1180 (t_url->instant_url() == data->instant_url) && 1181 (t_url->image_url() == data->image_url) && 1182 (t_url->new_tab_url() == data->new_tab_url) && 1183 (t_url->search_url_post_params() == data->search_url_post_params) && 1184 (t_url->suggestions_url_post_params() == 1185 data->suggestions_url_post_params) && 1186 (t_url->instant_url_post_params() == data->instant_url_post_params) && 1187 (t_url->image_url_post_params() == data->image_url_post_params) && 1188 (t_url->favicon_url() == data->favicon_url) && 1189 (t_url->safe_for_autoreplace() == data->safe_for_autoreplace) && 1190 (t_url->show_in_default_list() == data->show_in_default_list) && 1191 (t_url->input_encodings() == data->input_encodings) && 1192 (t_url->alternate_urls() == data->alternate_urls) && 1193 (t_url->search_terms_replacement_key() == 1194 data->search_terms_replacement_key); 1195 } 1196 1197 base::string16 TemplateURL::AdjustedShortNameForLocaleDirection() const { 1198 base::string16 bidi_safe_short_name = data_.short_name; 1199 base::i18n::AdjustStringForLocaleDirection(&bidi_safe_short_name); 1200 return bidi_safe_short_name; 1201 } 1202 1203 bool TemplateURL::ShowInDefaultList( 1204 const SearchTermsData& search_terms_data) const { 1205 return data_.show_in_default_list && 1206 url_ref_.SupportsReplacement(search_terms_data); 1207 } 1208 1209 bool TemplateURL::SupportsReplacement( 1210 const SearchTermsData& search_terms_data) const { 1211 return url_ref_.SupportsReplacement(search_terms_data); 1212 } 1213 1214 bool TemplateURL::HasGoogleBaseURLs( 1215 const SearchTermsData& search_terms_data) const { 1216 return url_ref_.HasGoogleBaseURLs(search_terms_data) || 1217 suggestions_url_ref_.HasGoogleBaseURLs(search_terms_data) || 1218 instant_url_ref_.HasGoogleBaseURLs(search_terms_data) || 1219 image_url_ref_.HasGoogleBaseURLs(search_terms_data) || 1220 new_tab_url_ref_.HasGoogleBaseURLs(search_terms_data); 1221 } 1222 1223 bool TemplateURL::IsGoogleSearchURLWithReplaceableKeyword( 1224 const SearchTermsData& search_terms_data) const { 1225 return (GetType() == NORMAL) && 1226 url_ref_.HasGoogleBaseURLs(search_terms_data) && 1227 google_util::IsGoogleHostname(base::UTF16ToUTF8(data_.keyword()), 1228 google_util::DISALLOW_SUBDOMAIN); 1229 } 1230 1231 bool TemplateURL::HasSameKeywordAs( 1232 const TemplateURLData& other, 1233 const SearchTermsData& search_terms_data) const { 1234 return (data_.keyword() == other.keyword()) || 1235 (IsGoogleSearchURLWithReplaceableKeyword(search_terms_data) && 1236 TemplateURL(other).IsGoogleSearchURLWithReplaceableKeyword( 1237 search_terms_data)); 1238 } 1239 1240 TemplateURL::Type TemplateURL::GetType() const { 1241 if (extension_info_) 1242 return NORMAL_CONTROLLED_BY_EXTENSION; 1243 return GURL(data_.url()).SchemeIs(extensions::kExtensionScheme) ? 1244 OMNIBOX_API_EXTENSION : NORMAL; 1245 } 1246 1247 std::string TemplateURL::GetExtensionId() const { 1248 DCHECK_NE(NORMAL, GetType()); 1249 return extension_info_ ? 1250 extension_info_->extension_id : GURL(data_.url()).host(); 1251 } 1252 1253 size_t TemplateURL::URLCount() const { 1254 // Add 1 for the regular search URL. 1255 return data_.alternate_urls.size() + 1; 1256 } 1257 1258 const std::string& TemplateURL::GetURL(size_t index) const { 1259 DCHECK_LT(index, URLCount()); 1260 1261 return (index < data_.alternate_urls.size()) ? 1262 data_.alternate_urls[index] : url(); 1263 } 1264 1265 bool TemplateURL::ExtractSearchTermsFromURL( 1266 const GURL& url, 1267 const SearchTermsData& search_terms_data, 1268 base::string16* search_terms) { 1269 return FindSearchTermsInURL(url, search_terms_data, search_terms, NULL, NULL); 1270 } 1271 1272 bool TemplateURL::IsSearchURL( 1273 const GURL& url, 1274 const SearchTermsData& search_terms_data) { 1275 base::string16 search_terms; 1276 return ExtractSearchTermsFromURL(url, search_terms_data, &search_terms) && 1277 !search_terms.empty(); 1278 } 1279 1280 bool TemplateURL::HasSearchTermsReplacementKey(const GURL& url) const { 1281 // Look for the key both in the query and the ref. 1282 std::string params[] = {url.query(), url.ref()}; 1283 1284 for (int i = 0; i < 2; ++i) { 1285 url::Component query, key, value; 1286 query.len = static_cast<int>(params[i].size()); 1287 while (url::ExtractQueryKeyValue(params[i].c_str(), &query, &key, &value)) { 1288 if (key.is_nonempty() && 1289 params[i].substr(key.begin, key.len) == 1290 search_terms_replacement_key()) { 1291 return true; 1292 } 1293 } 1294 } 1295 return false; 1296 } 1297 1298 bool TemplateURL::ReplaceSearchTermsInURL( 1299 const GURL& url, 1300 const TemplateURLRef::SearchTermsArgs& search_terms_args, 1301 const SearchTermsData& search_terms_data, 1302 GURL* result) { 1303 // TODO(beaudoin): Use AQS from |search_terms_args| too. 1304 url::Parsed::ComponentType search_term_component; 1305 url::Component search_terms_position; 1306 base::string16 search_terms; 1307 if (!FindSearchTermsInURL(url, search_terms_data, &search_terms, 1308 &search_term_component, &search_terms_position)) { 1309 return false; 1310 } 1311 DCHECK(search_terms_position.is_nonempty()); 1312 1313 // FindSearchTermsInURL only returns true for search terms in the query or 1314 // ref, so we can call EncodeSearchTerm with |is_in_query| = true, since query 1315 // and ref are encoded in the same way. 1316 std::string input_encoding; 1317 base::string16 encoded_terms; 1318 base::string16 encoded_original_query; 1319 EncodeSearchTerms(search_terms_args, true, &input_encoding, 1320 &encoded_terms, &encoded_original_query); 1321 1322 std::string old_params( 1323 (search_term_component == url::Parsed::REF) ? url.ref() : url.query()); 1324 std::string new_params(old_params, 0, search_terms_position.begin); 1325 new_params += base::UTF16ToUTF8(search_terms_args.search_terms); 1326 new_params += old_params.substr(search_terms_position.end()); 1327 url::StdStringReplacements<std::string> replacements; 1328 if (search_term_component == url::Parsed::REF) 1329 replacements.SetRefStr(new_params); 1330 else 1331 replacements.SetQueryStr(new_params); 1332 *result = url.ReplaceComponents(replacements); 1333 return true; 1334 } 1335 1336 void TemplateURL::EncodeSearchTerms( 1337 const TemplateURLRef::SearchTermsArgs& search_terms_args, 1338 bool is_in_query, 1339 std::string* input_encoding, 1340 base::string16* encoded_terms, 1341 base::string16* encoded_original_query) const { 1342 1343 std::vector<std::string> encodings(input_encodings()); 1344 if (std::find(encodings.begin(), encodings.end(), "UTF-8") == encodings.end()) 1345 encodings.push_back("UTF-8"); 1346 for (std::vector<std::string>::const_iterator i(encodings.begin()); 1347 i != encodings.end(); ++i) { 1348 if (TryEncoding(search_terms_args.search_terms, 1349 search_terms_args.original_query, i->c_str(), 1350 is_in_query, encoded_terms, encoded_original_query)) { 1351 *input_encoding = *i; 1352 return; 1353 } 1354 } 1355 NOTREACHED(); 1356 } 1357 1358 GURL TemplateURL::GenerateSearchURL( 1359 const SearchTermsData& search_terms_data) const { 1360 if (!url_ref_.IsValid(search_terms_data)) 1361 return GURL(); 1362 1363 if (!url_ref_.SupportsReplacement(search_terms_data)) 1364 return GURL(url()); 1365 1366 // Use something obscure for the search terms argument so that in the rare 1367 // case the term replaces the URL it's unlikely another keyword would have the 1368 // same url. 1369 // TODO(jnd): Add additional parameters to get post data when the search URL 1370 // has post parameters. 1371 return GURL(url_ref_.ReplaceSearchTerms( 1372 TemplateURLRef::SearchTermsArgs( 1373 base::ASCIIToUTF16("blah.blah.blah.blah.blah")), 1374 search_terms_data, NULL)); 1375 } 1376 1377 void TemplateURL::CopyFrom(const TemplateURL& other) { 1378 if (this == &other) 1379 return; 1380 1381 data_ = other.data_; 1382 url_ref_.InvalidateCachedValues(); 1383 suggestions_url_ref_.InvalidateCachedValues(); 1384 instant_url_ref_.InvalidateCachedValues(); 1385 SetPrepopulateId(other.data_.prepopulate_id); 1386 } 1387 1388 void TemplateURL::SetURL(const std::string& url) { 1389 data_.SetURL(url); 1390 url_ref_.InvalidateCachedValues(); 1391 } 1392 1393 void TemplateURL::SetPrepopulateId(int id) { 1394 data_.prepopulate_id = id; 1395 const bool prepopulated = id > 0; 1396 url_ref_.prepopulated_ = prepopulated; 1397 suggestions_url_ref_.prepopulated_ = prepopulated; 1398 instant_url_ref_.prepopulated_ = prepopulated; 1399 } 1400 1401 void TemplateURL::ResetKeywordIfNecessary( 1402 const SearchTermsData& search_terms_data, 1403 bool force) { 1404 if (IsGoogleSearchURLWithReplaceableKeyword(search_terms_data) || force) { 1405 DCHECK(GetType() != OMNIBOX_API_EXTENSION); 1406 GURL url(GenerateSearchURL(search_terms_data)); 1407 if (url.is_valid()) 1408 data_.SetKeyword(GenerateKeyword(url)); 1409 } 1410 } 1411 1412 bool TemplateURL::FindSearchTermsInURL( 1413 const GURL& url, 1414 const SearchTermsData& search_terms_data, 1415 base::string16* search_terms, 1416 url::Parsed::ComponentType* search_term_component, 1417 url::Component* search_terms_position) { 1418 DCHECK(search_terms); 1419 search_terms->clear(); 1420 1421 // Try to match with every pattern. 1422 for (size_t i = 0; i < URLCount(); ++i) { 1423 TemplateURLRef ref(this, i); 1424 if (ref.ExtractSearchTermsFromURL(url, search_terms, search_terms_data, 1425 search_term_component, search_terms_position)) { 1426 // If ExtractSearchTermsFromURL() returns true and |search_terms| is empty 1427 // it means the pattern matched but no search terms were present. In this 1428 // case we fail immediately without looking for matches in subsequent 1429 // patterns. This means that given patterns 1430 // [ "http://foo/#q={searchTerms}", "http://foo/?q={searchTerms}" ], 1431 // calling ExtractSearchTermsFromURL() on "http://foo/?q=bar#q=' would 1432 // return false. This is important for at least Google, where such URLs 1433 // are invalid. 1434 return !search_terms->empty(); 1435 } 1436 } 1437 return false; 1438 } 1439