1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
|
// Copyright 2014 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#ifndef COMPONENTS_SEARCH_ENGINES_TEMPLATE_URL_H_
#define COMPONENTS_SEARCH_ENGINES_TEMPLATE_URL_H_
#include <cstddef>
#include <memory>
#include <string>
#include <utility>
#include <vector>
#include "base/gtest_prod_util.h"
#include "base/macros.h"
#include "base/time/time.h"
#include "components/search_engines/omnibox_focus_type.h"
#include "components/search_engines/search_engine_type.h"
#include "components/search_engines/template_url_data.h"
#include "components/search_engines/template_url_id.h"
#include "third_party/metrics_proto/omnibox_event.pb.h"
#include "third_party/metrics_proto/omnibox_input_type.pb.h"
#include "ui/gfx/geometry/size.h"
#include "url/gurl.h"
#include "url/third_party/mozilla/url_parse.h"
class SearchTermsData;
class TemplateURL;
// TemplateURLRef -------------------------------------------------------------
// A TemplateURLRef represents a single URL within the larger TemplateURL class
// (which represents an entire "search engine", see below). If
// SupportsReplacement() is true, this URL has placeholders in it, for which
// callers can substitute values to get a "real" URL using ReplaceSearchTerms().
//
// TemplateURLRefs always have a non-NULL |owner_| TemplateURL, which they
// access in order to get at important data like the underlying URL string or
// the associated Profile.
class TemplateURLRef {
 public:
  // Magic numbers to pass to ReplaceSearchTerms() for the |accepted_suggestion|
  // parameter. Most callers aren't using Suggest capabilities and should just
  // pass NO_SUGGESTIONS_AVAILABLE.
  // NOTE: Because positive values are meaningful, make sure these are negative!
  enum AcceptedSuggestion {
    NO_SUGGESTION_CHOSEN = -1,
    NO_SUGGESTIONS_AVAILABLE = -2,
  };

  // Which kind of URL within our owner we are. This allows us to get at the
  // correct string field. Use |INDEXED| to indicate that the numerical
  // |index_in_owner_| should be used instead.
  enum Type {
    SEARCH,
    SUGGEST,
    IMAGE,
    NEW_TAB,
    CONTEXTUAL_SEARCH,
    INDEXED
  };

  // Type to store <content_type, post_data> pair for POST URLs.
  // The |content_type| (first part of the pair) is the content-type of
  // the |post_data| (second part of the pair) which is encoded in
  // "multipart/form-data" format; it also contains the MIME boundary used in
  // the |post_data|. See http://tools.ietf.org/html/rfc2046 for the details.
  using PostContent = std::pair<std::string, std::string>;

  // Enumeration of the known search or suggest request sources.
  enum RequestSource {
    SEARCHBOX,          // Omnibox or the NTP realbox. The default.
    CROS_APP_LIST,      // Chrome OS app list search box.
    NON_SEARCHBOX_NTP,  // Non-searchbox NTP surfaces.
  };

  // This struct encapsulates arguments passed to
  // TemplateURLRef::ReplaceSearchTerms methods. By default, only search_terms
  // is required and is passed in the constructor.
  struct SearchTermsArgs {
    SearchTermsArgs();
    explicit SearchTermsArgs(const base::string16& search_terms);
    SearchTermsArgs(const SearchTermsArgs& other);
    ~SearchTermsArgs();

    struct ContextualSearchParams {
      ContextualSearchParams();

      // Modern constructor, used when the content is sent in the HTTP header
      // instead of as CGI parameters.
      // The |version| tells the server which version of the client is making
      // this request.
      // The |contextual_cards_version| tells the server which version of
      // contextual cards integration is being used by the client.
      // The |home_country| is an ISO country code for the country that the user
      // considers their permanent home (which may be different from the country
      // they are currently visiting). Pass an empty string if none available.
      // The |previous_event_id| is an identifier previously returned by the
      // server to identify that user interaction.
      // The |previous_event_results| are the results of the user-interaction of
      // that previous request.
      // The "previous_xyz" parameters are documented in go/cs-sanitized.
      // The |is_exact_search| allows the search request to be narrowed down to
      // an "exact" search only, meaning just search for X rather than X +
      // whatever else is in the context. The returned search term should not
      // be expanded, and the server will honor this along with creating a
      // narrow Search Term.
      // The |source_lang| specifies a source language hint to apply for
      // translation or to indicate that translation might be appropriate.
      // This comes from CLD evaluating the selection and/or page content.
      // The |target_lang| specifies the best language to translate into for
      // the user, which also indicates when translation is appropriate or
      // helpful. This comes from the Chrome Language Model.
      // The |fluent_languages| string specifies the languages the user
      // is fluent in reading. This acts as an alternate set of languages
      // to consider translating into. The languages are ordered by
      // fluency, and encoded as a comma-separated list of BCP 47 languages.
      // The |related_searches_stamp| string contains information that
      // indicates experiment status and server processing results so that
      // they can be logged in GWS Sawmill logs for offline analysis for the
      // Related Searches MVP experiment.
      ContextualSearchParams(int version,
                             int contextual_cards_version,
                             std::string home_country,
                             int64_t previous_event_id,
                             int previous_event_results,
                             bool is_exact_search,
                             std::string source_lang,
                             std::string target_lang,
                             std::string fluent_languages,
                             std::string related_searches_stamp);
      ContextualSearchParams(const ContextualSearchParams& other);
      ~ContextualSearchParams();

      // Estimates dynamic memory usage.
      // See base/trace_event/memory_usage_estimator.h for more info.
      size_t EstimateMemoryUsage() const;

      // The version of contextual search.
      int version = -1;

      // The version of Contextual Cards data to request.
      // A value of 0 indicates no data needed.
      int contextual_cards_version = 0;

      // The locale of the user's home country in an ISO country code format,
      // or an empty string if not available. This indicates where the user
      // resides, not where they currently are.
      std::string home_country;

      // An EventID from a previous interaction (sent by server, recorded by
      // client).
      int64_t previous_event_id = 0;

      // An encoded set of booleans that represent the interaction results from
      // the previous event.
      int previous_event_results = 0;

      // A flag that restricts the search to exactly match the selection rather
      // than expanding the Search Term to include other words in the context.
      bool is_exact_search = false;

      // Source language string to translate from.
      std::string source_lang;

      // Target language string to be translated into.
      std::string target_lang;

      // Alternate target languages that the user is fluent in, encoded in a
      // single string.
      std::string fluent_languages;

      // Experiment arm and processing information for the Related Searches
      // experiment. The value is an arbitrary string that starts with a
      // schema version number.
      std::string related_searches_stamp;
    };

    // Estimates dynamic memory usage.
    // See base/trace_event/memory_usage_estimator.h for more info.
    size_t EstimateMemoryUsage() const;

    // The search terms (query).
    base::string16 search_terms;

    // The original (input) query.
    base::string16 original_query;

    // The type the original input query was identified as.
    metrics::OmniboxInputType input_type = metrics::OmniboxInputType::EMPTY;

    // Specifies how the user last interacted with the searchbox UI element.
    OmniboxFocusType focus_type = OmniboxFocusType::DEFAULT;

    // The optional assisted query stats, aka AQS, used for logging purposes.
    // This string contains impressions of all autocomplete matches shown
    // at the query submission time. For privacy reasons, we require the
    // search provider to support HTTPS protocol in order to receive the AQS
    // param.
    // For more details, see http://goto.google.com/binary-clients-logging .
    std::string assisted_query_stats;

    // TODO: Remove along with "aq" CGI param.
    int accepted_suggestion = NO_SUGGESTIONS_AVAILABLE;

    // The 0-based position of the cursor within the query string at the time
    // the request was issued. Set to base::string16::npos if not used.
    size_t cursor_position = base::string16::npos;

    // The URL of the current webpage to be used for experimental zero-prefix
    // suggestions.
    std::string current_page_url;

    // Which omnibox the user used to type the prefix.
    metrics::OmniboxEventProto::PageClassification page_classification =
        metrics::OmniboxEventProto::INVALID_SPEC;

    // Optional session token.
    std::string session_token;

    // Prefetch query and type.
    std::string prefetch_query;
    std::string prefetch_query_type;

    // Additional query params to append to the request.
    std::string additional_query_params;

    // If set, ReplaceSearchTerms() will automatically append any extra query
    // params specified via the --extra-search-query-params command-line
    // argument. Generally, this should be set when dealing with the search
    // TemplateURLRefs of the default search engine and the caller cares
    // about the query portion of the URL. Since neither TemplateURLRef nor
    // indeed TemplateURL know whether a TemplateURL is the default search
    // engine, callers instead must set this manually.
    bool append_extra_query_params_from_command_line = false;

    // The raw content of an image thumbnail that will be used as a query for
    // search-by-image frontend.
    std::string image_thumbnail_content;

    // When searching for an image, the URL of the original image. Callers
    // should leave this empty for images specified via data: URLs.
    GURL image_url;

    // When searching for an image, the original size of the image.
    gfx::Size image_original_size;

    // Source of the search or suggest request.
    RequestSource request_source = SEARCHBOX;

    // Parameters specific to contextual search requests; see
    // ContextualSearchParams above for the meaning of each field.
    ContextualSearchParams contextual_search_params;
  };

  TemplateURLRef(const TemplateURL* owner, Type type);
  TemplateURLRef(const TemplateURL* owner, size_t index_in_owner);
  ~TemplateURLRef();
  TemplateURLRef(const TemplateURLRef& source);
  TemplateURLRef& operator=(const TemplateURLRef& source);

  // Returns the raw URL. None of the parameters will have been replaced.
  std::string GetURL() const;

  // Returns the raw string of the post params. Please see comments in
  // prepopulated_engines_schema.json for the format.
  std::string GetPostParamsString() const;

  // Returns true if this URL supports search term replacement.
  bool SupportsReplacement(const SearchTermsData& search_terms_data) const;

  // Returns a string that is the result of replacing the search terms in
  // the url with the specified arguments. We use our owner's input encoding.
  //
  // If this TemplateURLRef does not support replacement (SupportsReplacement
  // returns false), an empty string is returned.
  // If this TemplateURLRef uses POST, and |post_content| is not null, the
  // |post_params_| will be replaced, encoded in "multipart/form-data" format
  // and stored into |post_content|.
  std::string ReplaceSearchTerms(const SearchTermsArgs& search_terms_args,
                                 const SearchTermsData& search_terms_data,
                                 PostContent* post_content) const;

  // Convenience overload that forwards to the three-argument version with a
  // null |post_content|.
  // TODO(jnd): remove the following ReplaceSearchTerms definition which does
  // not have |post_content| parameter once all reference callers pass
  // |post_content| parameter.
  std::string ReplaceSearchTerms(
      const SearchTermsArgs& search_terms_args,
      const SearchTermsData& search_terms_data) const {
    return ReplaceSearchTerms(search_terms_args, search_terms_data, nullptr);
  }

  // Returns true if the TemplateURLRef is valid. An invalid TemplateURLRef is
  // one that contains unknown terms, or invalid characters.
  bool IsValid(const SearchTermsData& search_terms_data) const;

  // Returns a string representation of this TemplateURLRef suitable for
  // display. The display format is the same as the format used by Firefox.
  base::string16 DisplayURL(const SearchTermsData& search_terms_data) const;

  // Converts a string as returned by DisplayURL back into a string as
  // understood by TemplateURLRef.
  static std::string DisplayURLToURLRef(const base::string16& display_url);

  // If this TemplateURLRef is valid and contains one search term, this returns
  // the host/path of the URL, otherwise this returns an empty string.
  const std::string& GetHost(const SearchTermsData& search_terms_data) const;
  std::string GetPath(const SearchTermsData& search_terms_data) const;

  // If this TemplateURLRef is valid and contains one search term
  // in its query or ref, this returns the key of the search term,
  // otherwise this returns an empty string.
  const std::string& GetSearchTermKey(
      const SearchTermsData& search_terms_data) const;

  // If this TemplateURLRef is valid and contains one search term,
  // this returns the location of the search term,
  // otherwise this returns url::Parsed::QUERY.
  url::Parsed::ComponentType GetSearchTermKeyLocation(
      const SearchTermsData& search_terms_data) const;

  // If this TemplateURLRef is valid and contains one search term,
  // this returns the fixed prefix before the search term,
  // otherwise this returns an empty string.
  const std::string& GetSearchTermValuePrefix(
      const SearchTermsData& search_terms_data) const;

  // If this TemplateURLRef is valid and contains one search term,
  // this returns the fixed suffix after the search term,
  // otherwise this returns an empty string.
  const std::string& GetSearchTermValueSuffix(
      const SearchTermsData& search_terms_data) const;

  // Converts the specified term in our owner's encoding to a base::string16.
  base::string16 SearchTermToString16(const base::StringPiece& term) const;

  // Returns true if this TemplateURLRef has a replacement term of
  // {google:baseURL} or {google:baseSuggestURL}.
  bool HasGoogleBaseURLs(const SearchTermsData& search_terms_data) const;

  // Use the pattern referred to by this TemplateURLRef to match the provided
  // |url| and extract |search_terms| from it. Returns true if the pattern
  // matches, even if |search_terms| is empty. In this case
  // |search_term_component|, if not null, indicates whether the search terms
  // were found in the query or the ref parameters; and |search_terms_position|,
  // if not null, contains the position of the search terms in the query or the
  // ref parameters. Returns false and an empty |search_terms| if the pattern
  // does not match.
  bool ExtractSearchTermsFromURL(
      const GURL& url,
      base::string16* search_terms,
      const SearchTermsData& search_terms_data,
      url::Parsed::ComponentType* search_term_component,
      url::Component* search_terms_position) const;

  // Whether the URL uses POST (as opposed to GET).
  bool UsesPOSTMethod(const SearchTermsData& search_terms_data) const;

  // Estimates dynamic memory usage.
  // See base/trace_event/memory_usage_estimator.h for more info.
  size_t EstimateMemoryUsage() const;

 private:
  friend class TemplateURL;
  friend class TemplateURLTest;
  FRIEND_TEST_ALL_PREFIXES(TemplateURLTest, SetPrepopulatedAndParse);
  FRIEND_TEST_ALL_PREFIXES(TemplateURLTest, ParseParameterKnown);
  FRIEND_TEST_ALL_PREFIXES(TemplateURLTest, ParseParameterUnknown);
  FRIEND_TEST_ALL_PREFIXES(TemplateURLTest, ParseURLEmpty);
  FRIEND_TEST_ALL_PREFIXES(TemplateURLTest, ParseURLNoTemplateEnd);
  FRIEND_TEST_ALL_PREFIXES(TemplateURLTest, ParseURLNoKnownParameters);
  FRIEND_TEST_ALL_PREFIXES(TemplateURLTest, ParseURLTwoParameters);
  FRIEND_TEST_ALL_PREFIXES(TemplateURLTest, ParseURLNestedParameter);
  FRIEND_TEST_ALL_PREFIXES(TemplateURLTest, URLRefTestImageURLWithPOST);

  // Enumeration of the known types.
  enum ReplacementType {
    ENCODING,
    GOOGLE_ASSISTED_QUERY_STATS,
    GOOGLE_BASE_URL,
    GOOGLE_BASE_SUGGEST_URL,
    GOOGLE_CONTEXTUAL_SEARCH_VERSION,
    GOOGLE_CONTEXTUAL_SEARCH_CONTEXT_DATA,
    GOOGLE_CURRENT_PAGE_URL,
    GOOGLE_CURSOR_POSITION,
    GOOGLE_IMAGE_ORIGINAL_HEIGHT,
    GOOGLE_IMAGE_ORIGINAL_WIDTH,
    GOOGLE_IMAGE_SEARCH_SOURCE,
    GOOGLE_IMAGE_THUMBNAIL,
    GOOGLE_IMAGE_THUMBNAIL_BASE64,
    GOOGLE_IMAGE_URL,
    GOOGLE_INPUT_TYPE,
    GOOGLE_IOS_SEARCH_LANGUAGE,
    GOOGLE_NTP_IS_THEMED,
    GOOGLE_OMNIBOX_FOCUS_TYPE,
    GOOGLE_ORIGINAL_QUERY_FOR_SUGGESTION,
    GOOGLE_PAGE_CLASSIFICATION,
    GOOGLE_PREFETCH_QUERY,
    GOOGLE_RLZ,
    GOOGLE_SEARCH_CLIENT,
    GOOGLE_SEARCH_FIELDTRIAL_GROUP,
    GOOGLE_SEARCH_VERSION,
    GOOGLE_SESSION_TOKEN,
    GOOGLE_SUGGEST_CLIENT,
    GOOGLE_SUGGEST_REQUEST_ID,
    GOOGLE_UNESCAPED_SEARCH_TERMS,
    LANGUAGE,
    MAIL_RU_REFERRAL_ID,
    SEARCH_TERMS,
    YANDEX_REFERRAL_ID,
  };

  // Used to identify an element of the raw url that can be replaced.
  struct Replacement {
    Replacement(ReplacementType type, size_t index)
        : type(type), index(index), is_post_param(false) {}

    ReplacementType type;
    size_t index;

    // Indicates where the replacement is applied. If |is_post_param| is
    // false, |index| indicates the byte position in |parsed_url_|.
    // Otherwise, |index| is the index of |post_params_|.
    bool is_post_param;
  };

  // Stores a single parameter for a POST.
  struct PostParam {
    std::string name;
    std::string value;
    std::string content_type;

    // Estimates dynamic memory usage.
    // See base/trace_event/memory_usage_estimator.h for more info.
    size_t EstimateMemoryUsage() const;
  };

  // The list of elements to replace.
  using Replacements = std::vector<Replacement>;

  // The list of parameters for a POST.
  using PostParams = std::vector<PostParam>;

  // TemplateURLRef internally caches values to make replacement quick. This
  // method invalidates any cached values.
  void InvalidateCachedValues() const;

  // Parses the parameter in url at the specified offset. start/end specify the
  // range of the parameter in the url, including the braces. If the parameter
  // is valid, url is updated to reflect the appropriate parameter. If
  // the parameter is one of the known parameters an element is added to
  // replacements indicating the type and range of the element. The original
  // parameter is erased from the url.
  //
  // If the parameter is not a known parameter, false is returned. If this is a
  // prepopulated URL, the parameter is erased, otherwise it is left alone.
  bool ParseParameter(size_t start,
                      size_t end,
                      std::string* url,
                      Replacements* replacements) const;

  // Parses the specified url, replacing parameters as necessary. If
  // successful, valid is set to true, and the parsed url is returned. For all
  // known parameters that are encountered an entry is added to replacements.
  // If there is an error parsing the url, valid is set to false, and an empty
  // string is returned. If the URL has the POST parameters, they will be
  // parsed into |post_params| which will be further replaced with real search
  // terms data and encoded in "multipart/form-data" format to generate the
  // POST data.
  std::string ParseURL(const std::string& url,
                       Replacements* replacements,
                       PostParams* post_params,
                       bool* valid) const;

  // If the url has not yet been parsed, ParseURL is invoked.
  // NOTE: While this is const, it modifies mutable cached members such as
  // parsed_, valid_ and parsed_url_.
  void ParseIfNecessary(const SearchTermsData& search_terms_data) const;

  // Parses a wildcard out of |path|, putting the parsed path in |path_prefix_|
  // and |path_suffix_| and setting |path_wildcard_present_| to true.
  // In the absence of a wildcard, the full path will be contained in
  // |path_prefix_| and |path_wildcard_present_| will be false.
  void ParsePath(const std::string& path) const;

  // Returns whether the path portion of this template URL is equal to the path
  // in |url|, checking that URL is prefixed/suffixed by
  // |path_prefix_|/|path_suffix_| if |path_wildcard_present_| is true, or equal
  // to |path_prefix_| otherwise.
  bool PathIsEqual(const GURL& url) const;

  // Extracts the query key and host from the url.
  void ParseHostAndSearchTermKey(
      const SearchTermsData& search_terms_data) const;

  // Encode post parameters in "multipart/form-data" format and store it
  // inside |post_content|. Returns false if errors are encountered during
  // encoding. This method is called each time ReplaceSearchTerms gets called.
  bool EncodeFormData(const PostParams& post_params,
                      PostContent* post_content) const;

  // Handles a replacement by using real term data. If the replacement
  // belongs to a PostParam, the PostParam will be replaced by the term data.
  // Otherwise, the term data will be inserted at the place that the
  // replacement points to.
  void HandleReplacement(const std::string& name,
                         const std::string& value,
                         const Replacement& replacement,
                         std::string* url) const;

  // Replaces all replacements in |parsed_url_| with their actual values and
  // returns the result. This is the main functionality of
  // ReplaceSearchTerms().
  std::string HandleReplacements(
      const SearchTermsArgs& search_terms_args,
      const SearchTermsData& search_terms_data,
      PostContent* post_content) const;

  // The TemplateURL that contains us. This should outlive us.
  const TemplateURL* owner_;

  // What kind of URL we are.
  Type type_;

  // If |type_| is |INDEXED|, this |index_in_owner_| is used instead to refer to
  // a url within our owner.
  size_t index_in_owner_ = 0;

  // Whether the URL has been parsed.
  mutable bool parsed_ = false;

  // Whether the url was successfully parsed.
  mutable bool valid_ = false;

  // The parsed URL. All terms have been stripped out of this with
  // replacements_ giving the index of the terms to replace.
  mutable std::string parsed_url_;

  // Do we support search term replacement?
  mutable bool supports_replacements_ = false;

  // The replaceable parts of url (parsed_url_). These are ordered by index
  // into the string, and may be empty.
  mutable Replacements replacements_;

  // Whether the path contains a wildcard.
  mutable bool path_wildcard_present_ = false;

  // Host, port, path, key and location of the search term. These are only set
  // if the url contains one search term.
  mutable std::string host_;
  mutable std::string port_;
  mutable std::string path_prefix_;
  mutable std::string path_suffix_;
  mutable std::string search_term_key_;
  mutable url::Parsed::ComponentType search_term_key_location_ =
      url::Parsed::QUERY;
  mutable std::string search_term_value_prefix_;
  mutable std::string search_term_value_suffix_;

  // The POST parameters parsed out of the URL's post params string.
  mutable PostParams post_params_;

  // Whether the contained URL is a pre-populated URL.
  bool prepopulated_ = false;
};
// TemplateURL ----------------------------------------------------------------
// A TemplateURL represents a single "search engine", defined primarily as a
// subset of the Open Search Description Document
// (http://www.opensearch.org/Specifications/OpenSearch) plus some extensions.
// One TemplateURL contains several TemplateURLRefs, which correspond to various
// different capabilities (e.g. doing searches or getting suggestions), as well
// as a TemplateURLData containing other details like the name, keyword, etc.
//
// TemplateURLs are intended to be read-only for most users.
// The TemplateURLService, which handles storing and manipulating TemplateURLs,
// is made a friend so that it can be the exception to this pattern.
class TemplateURL {
public:
using TemplateURLVector = std::vector<TemplateURL*>;
using OwnedTemplateURLVector = std::vector<std::unique_ptr<TemplateURL>>;
// These values are not persisted and can be freely changed.
// Their integer values are used for choosing the best engine during keyword
// conflicts, so their relative ordering should not be changed without careful
// thought about what happens during version skew.
enum Type {
// Installed only on this device. Should not be synced. This is not common.
LOCAL = 0,
// Regular search engine. This is the most common.
NORMAL = 1,
// Installed by extension through Override Settings API.
NORMAL_CONTROLLED_BY_EXTENSION = 2,
// The keyword associated with an extension that uses the Omnibox API.
OMNIBOX_API_EXTENSION = 3,
};
// An AssociatedExtensionInfo represents information about the extension that
// added the search engine.
struct AssociatedExtensionInfo {
AssociatedExtensionInfo(const std::string& extension_id,
base::Time install_time,
bool wants_to_be_default_engine);
~AssociatedExtensionInfo();
// Estimates dynamic memory usage.
// See base/trace_event/memory_usage_estimator.h for more info.
size_t EstimateMemoryUsage() const;
std::string extension_id;
// Used to resolve conflicts when there are multiple extensions specifying
// the default search engine. The most recently-installed wins.
base::Time install_time;
// Whether the search engine is supposed to be default.
bool wants_to_be_default_engine;
};
explicit TemplateURL(const TemplateURLData& data, Type type = NORMAL);
// Constructor for extension controlled engine. |type| must be
// NORMAL_CONTROLLED_BY_EXTENSION or OMNIBOX_API_EXTENSION.
TemplateURL(const TemplateURLData& data,
Type type,
std::string extension_id,
base::Time install_time,
bool wants_to_be_default_engine);
~TemplateURL();
// For two engines with the same keyword, |this| and |other|,
// returns true if |this| is strictly better than |other|.
//
// While normal engines must all have distinct keywords, policy-created,
// extension-controlled and omnibox API engines may have the same keywords as
// each other or as normal engines. In these cases, policy-created engines
// override omnibox API engines, which override extension-controlled engines,
// which override normal engines.
//
// If there is still a conflict after this, compare by safe-for-autoreplace,
// then last modified date, then use the sync guid as a tiebreaker.
//
// TODO(tommycli): I'd like to use this to resolve Sync conflicts in the
// future, but we need a total ordering of TemplateURLs. That's not the case
// today, because the sync GUIDs are not actually globally unique, so there
// can be a genuine tie, which is not good, because then two different clients
// could choose to resolve the conflict in two different ways.
bool IsBetterThanEngineWithConflictingKeyword(const TemplateURL* other) const;
// Generates a suitable keyword for the specified url, which must be valid.
// This is guaranteed not to return an empty string, since TemplateURLs should
// never have an empty keyword.
static base::string16 GenerateKeyword(const GURL& url);
// Generates a favicon URL from the specified url.
static GURL GenerateFaviconURL(const GURL& url);
// Returns true if |t_url| and |data| are equal in all meaningful respects.
// Static to allow either or both params to be NULL.
static bool MatchesData(const TemplateURL* t_url,
const TemplateURLData* data,
const SearchTermsData& search_terms_data);
const TemplateURLData& data() const { return data_; }
const base::string16& short_name() const { return data_.short_name(); }
// An accessor for the short_name, but adjusted so it can be appropriately
// displayed even if it is LTR and the UI is RTL.
base::string16 AdjustedShortNameForLocaleDirection() const;
const base::string16& keyword() const { return data_.keyword(); }
const std::string& url() const { return data_.url(); }
const std::string& suggestions_url() const { return data_.suggestions_url; }
const std::string& image_url() const { return data_.image_url; }
const std::string& new_tab_url() const { return data_.new_tab_url; }
const std::string& contextual_search_url() const {
return data_.contextual_search_url;
}
const std::string& search_url_post_params() const {
return data_.search_url_post_params;
}
const std::string& suggestions_url_post_params() const {
return data_.suggestions_url_post_params;
}
const std::string& image_url_post_params() const {
return data_.image_url_post_params;
}
const std::vector<std::string>& alternate_urls() const {
return data_.alternate_urls;
}
const GURL& favicon_url() const { return data_.favicon_url; }
const GURL& logo_url() const { return data_.logo_url; }
const GURL& doodle_url() const { return data_.doodle_url; }
const GURL& originating_url() const { return data_.originating_url; }
bool safe_for_autoreplace() const { return data_.safe_for_autoreplace; }
const std::vector<std::string>& input_encodings() const {
return data_.input_encodings;
}
TemplateURLID id() const { return data_.id; }
base::Time date_created() const { return data_.date_created; }
base::Time last_modified() const { return data_.last_modified; }
base::Time last_visited() const { return data_.last_visited; }
bool created_by_policy() const { return data_.created_by_policy; }
bool created_from_play_api() const { return data_.created_from_play_api; }
int usage_count() const { return data_.usage_count; }
int prepopulate_id() const { return data_.prepopulate_id; }
const std::string& sync_guid() const { return data_.sync_guid; }
const std::vector<TemplateURLRef>& url_refs() const { return url_refs_; }
const TemplateURLRef& url_ref() const {
// Sanity check for https://crbug.com/781703.
CHECK(!url_refs_.empty());
return url_refs_.back();
}
const TemplateURLRef& suggestions_url_ref() const {
return suggestions_url_ref_;
}
const TemplateURLRef& image_url_ref() const { return image_url_ref_; }
const TemplateURLRef& new_tab_url_ref() const { return new_tab_url_ref_; }
// Returns the member |contextual_search_url_ref_| by const reference.
const TemplateURLRef& contextual_search_url_ref() const {
  return contextual_search_url_ref_;
}
// Returns |type_|, which is a const member and therefore never changes after
// construction.
Type type() const {
  return type_;
}
// Test-only accessor: returns the raw pointer held by |extension_info_|.
// Ownership stays with this object, and the result is null when
// |extension_info_| holds nothing.
const AssociatedExtensionInfo* GetExtensionInfoForTesting() const {
  return extension_info_.get();
}
// Returns true if |url| supports replacement.
// NOTE(review): this method takes no |url| parameter, so |url| presumably
// means this TemplateURL's own search URL (cf. url_ref()) -- confirm against
// the implementation.
bool SupportsReplacement(const SearchTermsData& search_terms_data) const;
// Returns true if any of this TemplateURL's URLRefs use Google base URLs.
bool HasGoogleBaseURLs(const SearchTermsData& search_terms_data) const;
// Returns true if this TemplateURL uses Google base URLs and has a keyword
// of "google.TLD". This is used to decide whether the keyword can be
// automatically updated to reflect the current Google base URL TLD (see
// ResetKeywordIfNecessary()).
bool IsGoogleSearchURLWithReplaceableKeyword(
const SearchTermsData& search_terms_data) const;
// Returns true if the keywords of |this| and |other| match, or if
// IsGoogleSearchURLWithReplaceableKeyword() is true for both |this| and
// |other|. Note that |other| is passed as a TemplateURLData, not as a
// TemplateURL.
bool HasSameKeywordAs(const TemplateURLData& other,
const SearchTermsData& search_terms_data) const;
// Returns (by value) the id of the extension that added this search engine.
// Precondition: only call this for TemplateURLs of type
// NORMAL_CONTROLLED_BY_EXTENSION or OMNIBOX_API_EXTENSION.
std::string GetExtensionId() const;
// Returns the type of this search engine, or SEARCH_ENGINE_OTHER if no
// engines match. The computed value is cached across successive calls in the
// mutable member |engine_type_|, which is how a const method can store it.
SearchEngineType GetEngineType(
const SearchTermsData& search_terms_data) const;
// Uses the alternate URLs and the search URL to match the provided |url|
// and extract |search_terms| from it. Returns false and an empty
// |search_terms| if no search terms can be matched. The URLs are matched in
// the order listed in |url_refs_| (see comment there). |search_terms| is an
// out-parameter written through the supplied pointer.
bool ExtractSearchTermsFromURL(const GURL& url,
const SearchTermsData& search_terms_data,
base::string16* search_terms) const;
// Returns true if non-empty search terms could be extracted from |url| using
// ExtractSearchTermsFromURL(). In other words, this reports whether |url|
// could be the result of performing a search with |this|.
bool IsSearchURL(const GURL& url,
const SearchTermsData& search_terms_data) const;
// Given a |url| corresponding to this TemplateURL, identifies the search
// terms and replaces them with the ones in |search_terms_args|, leaving the
// other parameters untouched. |result| is the out-parameter for the rewritten
// URL; if the replacement fails, this returns false and leaves |result|
// untouched. This is used by mobile ports to perform query refinement.
bool ReplaceSearchTermsInURL(
const GURL& url,
const TemplateURLRef::SearchTermsArgs& search_terms_args,
const SearchTermsData& search_terms_data,
GURL* result) const;
// Encodes the search terms from |search_terms_args| and makes the
// |input_encoding| known to the caller. All results are returned through the
// out-parameters |input_encoding|, |encoded_terms| and
// |encoded_original_query|. |encoded_terms| may be escaped as path or query
// depending on |is_in_query|; |encoded_original_query| is always escaped as
// query.
void EncodeSearchTerms(
const TemplateURLRef::SearchTermsArgs& search_terms_args,
bool is_in_query,
std::string* input_encoding,
base::string16* encoded_terms,
base::string16* encoded_original_query) const;
// Returns the search URL for this TemplateURL, generated using
// |search_terms_data|. Returns an empty GURL if this TemplateURL has no
// url().
GURL GenerateSearchURL(const SearchTermsData& search_terms_data) const;
// TemplateURL internally caches values derived from a passed SearchTermsData
// to make its functions quick. This method invalidates any cached values and
// should be called after the SearchTermsData has been changed. It is declared
// const, so it can be invoked on const TemplateURLs.
void InvalidateCachedValues() const;
// Returns an estimate of this object's dynamic memory usage.
// See base/trace_event/memory_usage_estimator.h for more info.
size_t EstimateMemoryUsage() const;
private:
friend class TemplateURLService;
// Private mutator; besides this class, only the friend TemplateURLService can
// call it. NOTE(review): presumably copies the state of |other| into |this|
// -- confirm against the implementation.
void CopyFrom(const TemplateURL& other);
// Private mutator; besides this class, only the friend TemplateURLService can
// call it. NOTE(review): presumably replaces the search URL string with |url|
// -- confirm against the implementation.
void SetURL(const std::string& url);
// Private mutator; besides this class, only the friend TemplateURLService can
// call it. NOTE(review): presumably sets the value returned by
// prepopulate_id() to |id| -- confirm against the implementation.
void SetPrepopulateId(int id);
// Resets the keyword if IsGoogleSearchURLWithReplaceableKeyword() is true or
// if |force| is set. The |force| parameter is useful when the existing
// keyword is known to be a placeholder. The resulting keyword is generated
// using GenerateSearchURL() and GenerateKeyword().
void ResetKeywordIfNecessary(const SearchTermsData& search_terms_data,
bool force);
// Resizes the |url_refs_| vector, which always holds the search URL as the
// last item (url_ref() relies on this by returning the last element).
void ResizeURLRefVector();
// Uses the alternate URLs and the search URL to match the provided |url|
// and extract |search_terms| from it, as well as the
// |search_terms_component| (either REF or QUERY) and the
// |search_terms_position| at which the |search_terms| are found in |url|.
// See also ExtractSearchTermsFromURL().
bool FindSearchTermsInURL(const GURL& url,
const SearchTermsData& search_terms_data,
base::string16* search_terms,
url::Parsed::ComponentType* search_terms_component,
url::Component* search_terms_position) const;
// The TemplateURLData that backs the simple field accessors of this class
// (e.g. image_url(), id(), sync_guid()).
TemplateURLData data_;
// Contains TemplateURLRefs corresponding to the alternate URLs and the search
// URL, in priority order: the URL at index 0 is treated as the highest
// priority and the primary search URL is treated as the lowest priority. For
// example, if a TemplateURL has alternate URL "http://foo/#q={searchTerms}"
// and search URL "http://foo/?q={searchTerms}", and the URL to be decoded is
// "http://foo/?q=a#q=b", the alternate URL will match first and the decoded
// search term will be "b". Note that since every TemplateURL has a primary
// search URL, this vector is never empty (url_ref() CHECKs this).
std::vector<TemplateURLRef> url_refs_;
// TemplateURLRefs exposed through suggestions_url_ref(), image_url_ref(),
// new_tab_url_ref() and contextual_search_url_ref() respectively. Unlike the
// search and alternate URLs, these are not stored in |url_refs_|.
TemplateURLRef suggestions_url_ref_;
TemplateURLRef image_url_ref_;
TemplateURLRef new_tab_url_ref_;
TemplateURLRef contextual_search_url_ref_;
// Owned extension info; exposed to tests as a raw pointer through
// GetExtensionInfoForTesting(). NOTE(review): presumably only set for
// extension-provided engines -- confirm against the constructors.
std::unique_ptr<AssociatedExtensionInfo> extension_info_;
// The value returned by type(). Declared const, so it cannot change after
// construction.
const Type type_;
// Caches the computed engine type across successive calls to GetEngineType().
// Declared mutable so that the const GetEngineType() can update it.
mutable SearchEngineType engine_type_;
// TODO(sky): Add date last parsed OSD file.
DISALLOW_COPY_AND_ASSIGN(TemplateURL);
};
#endif // COMPONENTS_SEARCH_ENGINES_TEMPLATE_URL_H_
|