Home | History | Annotate | Download | only in autocomplete
      1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
      2 // Use of this source code is governed by a BSD-style license that can be
      3 // found in the LICENSE file.
      4 
      5 #include "chrome/browser/autocomplete/autocomplete_input.h"
      6 
      7 #include "base/basictypes.h"
      8 #include "base/strings/string16.h"
      9 #include "base/strings/utf_string_conversions.h"
     10 #include "build/build_config.h"
     11 #include "testing/gtest/include/gtest/gtest.h"
     12 #include "url/url_parse.h"
     13 
     14 TEST(AutocompleteInputTest, InputType) {
     15   struct test_data {
     16     const string16 input;
     17     const AutocompleteInput::Type type;
     18   } input_cases[] = {
     19     { string16(), AutocompleteInput::INVALID },
     20     { ASCIIToUTF16("?"), AutocompleteInput::FORCED_QUERY },
     21     { ASCIIToUTF16("?foo"), AutocompleteInput::FORCED_QUERY },
     22     { ASCIIToUTF16("?foo bar"), AutocompleteInput::FORCED_QUERY },
     23     { ASCIIToUTF16("?http://foo.com/bar"), AutocompleteInput::FORCED_QUERY },
     24     { ASCIIToUTF16("foo"), AutocompleteInput::UNKNOWN },
     25     { ASCIIToUTF16("localhost"), AutocompleteInput::URL },
     26     { ASCIIToUTF16("foo.c"), AutocompleteInput::UNKNOWN },
     27     { ASCIIToUTF16("foo.com"), AutocompleteInput::URL },
     28     { ASCIIToUTF16("-foo.com"), AutocompleteInput::URL },
     29     { ASCIIToUTF16("foo-.com"), AutocompleteInput::URL },
     30     { ASCIIToUTF16("foo_.com"), AutocompleteInput::UNKNOWN },
     31     { ASCIIToUTF16("foo.-com"), AutocompleteInput::QUERY },
     32     { ASCIIToUTF16("foo/"), AutocompleteInput::URL },
     33     { ASCIIToUTF16("foo/bar"), AutocompleteInput::UNKNOWN },
     34     { ASCIIToUTF16("foo/bar/"), AutocompleteInput::URL },
     35     { ASCIIToUTF16("foo/bar baz\\"), AutocompleteInput::URL },
     36     { ASCIIToUTF16("foo.com/bar"), AutocompleteInput::URL },
     37     { ASCIIToUTF16("foo;bar"), AutocompleteInput::UNKNOWN },
     38     { ASCIIToUTF16("foo/bar baz"), AutocompleteInput::UNKNOWN },
     39     { ASCIIToUTF16("foo bar.com"), AutocompleteInput::QUERY },
     40     { ASCIIToUTF16("foo bar"), AutocompleteInput::QUERY },
     41     { ASCIIToUTF16("foo+bar"), AutocompleteInput::QUERY },
     42     { ASCIIToUTF16("foo+bar.com"), AutocompleteInput::UNKNOWN },
     43     { ASCIIToUTF16("\"foo:bar\""), AutocompleteInput::QUERY },
     44     { ASCIIToUTF16("link:foo.com"), AutocompleteInput::UNKNOWN },
     45     { ASCIIToUTF16("foo:81"), AutocompleteInput::URL },
     46     { ASCIIToUTF16("localhost:8080"), AutocompleteInput::URL },
     47     { ASCIIToUTF16("www.foo.com:81"), AutocompleteInput::URL },
     48     { ASCIIToUTF16("foo.com:123456"), AutocompleteInput::QUERY },
     49     { ASCIIToUTF16("foo.com:abc"), AutocompleteInput::QUERY },
     50     { ASCIIToUTF16("1.2.3.4:abc"), AutocompleteInput::QUERY },
     51     { ASCIIToUTF16("user (at) foo.com"), AutocompleteInput::UNKNOWN },
     52     { ASCIIToUTF16("user@foo/z"), AutocompleteInput::URL },
     53     { ASCIIToUTF16("user@foo/z z"), AutocompleteInput::URL },
     54     { ASCIIToUTF16("user (at) foo.com/z"), AutocompleteInput::URL },
     55     { ASCIIToUTF16("user:pass@"), AutocompleteInput::UNKNOWN },
     56     { ASCIIToUTF16("user:pass@!foo.com"), AutocompleteInput::UNKNOWN },
     57     { ASCIIToUTF16("user:pass@foo"), AutocompleteInput::URL },
     58     { ASCIIToUTF16("user:pass (at) foo.c"), AutocompleteInput::URL },
     59     { ASCIIToUTF16("user:pass (at) foo.com"), AutocompleteInput::URL },
     60     { ASCIIToUTF16("user:pass (at) foo.com:81"), AutocompleteInput::URL },
     61     { ASCIIToUTF16("user:pass@foo:81"), AutocompleteInput::URL },
     62     { ASCIIToUTF16("1.2"), AutocompleteInput::UNKNOWN },
     63     { ASCIIToUTF16("1.2/45"), AutocompleteInput::UNKNOWN },
     64     { ASCIIToUTF16("1.2:45"), AutocompleteInput::UNKNOWN },
     65     { ASCIIToUTF16("user (at) 1.2:45"), AutocompleteInput::URL },
     66     { ASCIIToUTF16("user@foo:45"), AutocompleteInput::URL },
     67     { ASCIIToUTF16("user:pass (at) 1.2:45"), AutocompleteInput::URL },
     68     { ASCIIToUTF16("host?query"), AutocompleteInput::UNKNOWN },
     69     { ASCIIToUTF16("host#ref"), AutocompleteInput::UNKNOWN },
     70     { ASCIIToUTF16("host/path?query"), AutocompleteInput::URL },
     71     { ASCIIToUTF16("host/path#ref"), AutocompleteInput::URL },
     72     { ASCIIToUTF16("en.wikipedia.org/wiki/Jim Beam"), AutocompleteInput::URL },
     73     // In Chrome itself, mailto: will get handled by ShellExecute, but in
     74     // unittest mode, we don't have the data loaded in the external protocol
     75     // handler to know this.
     76     // { ASCIIToUTF16("mailto:abuse (at) foo.com"), AutocompleteInput::URL },
     77     { ASCIIToUTF16("view-source:http://www.foo.com/"), AutocompleteInput::URL },
     78     { ASCIIToUTF16("javascript:alert(\"Hi there\");"), AutocompleteInput::URL },
     79 #if defined(OS_WIN)
     80     { ASCIIToUTF16("C:\\Program Files"), AutocompleteInput::URL },
     81     { ASCIIToUTF16("\\\\Server\\Folder\\File"), AutocompleteInput::URL },
     82 #endif  // defined(OS_WIN)
     83     { ASCIIToUTF16("http:foo"), AutocompleteInput::URL },
     84     { ASCIIToUTF16("http://foo"), AutocompleteInput::URL },
     85     { ASCIIToUTF16("http://foo.c"), AutocompleteInput::URL },
     86     { ASCIIToUTF16("http://foo.com"), AutocompleteInput::URL },
     87     { ASCIIToUTF16("http://foo_bar.com"), AutocompleteInput::URL },
     88     { ASCIIToUTF16("http://foo/bar baz"), AutocompleteInput::URL },
     89     { ASCIIToUTF16("http://-foo.com"), AutocompleteInput::URL },
     90     { ASCIIToUTF16("http://foo-.com"), AutocompleteInput::URL },
     91     { ASCIIToUTF16("http://foo_.com"), AutocompleteInput::UNKNOWN },
     92     { ASCIIToUTF16("http://foo.-com"), AutocompleteInput::UNKNOWN },
     93     { ASCIIToUTF16("http://_foo_.com"), AutocompleteInput::UNKNOWN },
     94     { ASCIIToUTF16("http://foo.com:abc"), AutocompleteInput::QUERY },
     95     { ASCIIToUTF16("http://foo.com:123456"), AutocompleteInput::QUERY },
     96     { ASCIIToUTF16("http://1.2.3.4:abc"), AutocompleteInput::QUERY },
     97     { ASCIIToUTF16("http:user (at) foo.com"), AutocompleteInput::URL },
     98     { ASCIIToUTF16("http://user@foo.com"), AutocompleteInput::URL },
     99     { ASCIIToUTF16("http:user:pass (at) foo.com"), AutocompleteInput::URL },
    100     { ASCIIToUTF16("http://user:pass@foo.com"), AutocompleteInput::URL },
    101     { ASCIIToUTF16("http://1.2"), AutocompleteInput::URL },
    102     { ASCIIToUTF16("http://1.2/45"), AutocompleteInput::URL },
    103     { ASCIIToUTF16("http:ps/2 games"), AutocompleteInput::URL },
    104     { ASCIIToUTF16("https://foo.com"), AutocompleteInput::URL },
    105     { ASCIIToUTF16("127.0.0.1"), AutocompleteInput::URL },
    106     { ASCIIToUTF16("127.0.1"), AutocompleteInput::UNKNOWN },
    107     { ASCIIToUTF16("127.0.1/"), AutocompleteInput::URL },
    108     { ASCIIToUTF16("browser.tabs.closeButtons"), AutocompleteInput::UNKNOWN },
    109     { WideToUTF16(L"\u6d4b\u8bd5"), AutocompleteInput::UNKNOWN },
    110     { ASCIIToUTF16("[2001:]"), AutocompleteInput::QUERY },
    111     { ASCIIToUTF16("[2001:dB8::1]"), AutocompleteInput::URL },
    112     { ASCIIToUTF16("192.168.0.256"), AutocompleteInput::QUERY },
    113     { ASCIIToUTF16("[foo.com]"), AutocompleteInput::QUERY },
    114     { ASCIIToUTF16("filesystem:http://a.com/t/bar"), AutocompleteInput::URL },
    115     { ASCIIToUTF16("filesystem:http:foo"), AutocompleteInput::URL },
    116     { ASCIIToUTF16("filesystem:file://"), AutocompleteInput::URL },
    117     { ASCIIToUTF16("filesystem:http"), AutocompleteInput::URL },
    118     { ASCIIToUTF16("filesystem:"), AutocompleteInput::URL },
    119     { ASCIIToUTF16("ftp:"), AutocompleteInput::URL },
    120   };
    121 
    122   for (size_t i = 0; i < ARRAYSIZE_UNSAFE(input_cases); ++i) {
    123     SCOPED_TRACE(input_cases[i].input);
    124     AutocompleteInput input(input_cases[i].input, string16::npos, string16(),
    125                             GURL(), AutocompleteInput::INVALID_SPEC, true,
    126                             false, true, AutocompleteInput::ALL_MATCHES);
    127     EXPECT_EQ(input_cases[i].type, input.type());
    128   }
    129 }
    130 
    131 TEST(AutocompleteInputTest, InputTypeWithDesiredTLD) {
    132   struct test_data {
    133     const string16 input;
    134     const AutocompleteInput::Type type;
    135     const std::string spec;  // Unused if not a URL.
    136   } input_cases[] = {
    137     { ASCIIToUTF16("401k"), AutocompleteInput::URL,
    138         std::string("http://www.401k.com/") },
    139     { ASCIIToUTF16("999999999999999"), AutocompleteInput::URL,
    140         std::string("http://www.999999999999999.com/") },
    141     { ASCIIToUTF16("x@y"), AutocompleteInput::URL,
    142         std::string("http://x@www.y.com/") },
    143     { ASCIIToUTF16("y/z z"), AutocompleteInput::URL,
    144         std::string("http://www.y.com/z%20z") },
    145     { ASCIIToUTF16("abc.com"), AutocompleteInput::URL,
    146         std::string("http://abc.com/") },
    147     { ASCIIToUTF16("foo bar"), AutocompleteInput::QUERY, std::string() },
    148   };
    149 
    150   for (size_t i = 0; i < ARRAYSIZE_UNSAFE(input_cases); ++i) {
    151     SCOPED_TRACE(input_cases[i].input);
    152     AutocompleteInput input(input_cases[i].input, string16::npos,
    153                             ASCIIToUTF16("com"), GURL(),
    154                             AutocompleteInput::INVALID_SPEC, true, false, true,
    155                             AutocompleteInput::ALL_MATCHES);
    156     EXPECT_EQ(input_cases[i].type, input.type());
    157     if (input_cases[i].type == AutocompleteInput::URL)
    158       EXPECT_EQ(input_cases[i].spec, input.canonicalized_url().spec());
    159   }
    160 }
    161 
    162 // This tests for a regression where certain input in the omnibox caused us to
    163 // crash. As long as the test completes without crashing, we're fine.
    164 TEST(AutocompleteInputTest, InputCrash) {
    165   AutocompleteInput input(WideToUTF16(L"\uff65@s"), string16::npos, string16(),
    166                           GURL(), AutocompleteInput::INVALID_SPEC, true, false,
    167                           true, AutocompleteInput::ALL_MATCHES);
    168 }
    169 
    170 TEST(AutocompleteInputTest, ParseForEmphasizeComponent) {
    171   using url_parse::Component;
    172   Component kInvalidComponent(0, -1);
    173   struct test_data {
    174     const string16 input;
    175     const Component scheme;
    176     const Component host;
    177   } input_cases[] = {
    178     { string16(), kInvalidComponent, kInvalidComponent },
    179     { ASCIIToUTF16("?"), kInvalidComponent, kInvalidComponent },
    180     { ASCIIToUTF16("?http://foo.com/bar"), kInvalidComponent,
    181         kInvalidComponent },
    182     { ASCIIToUTF16("foo/bar baz"), kInvalidComponent, Component(0, 3) },
    183     { ASCIIToUTF16("http://foo/bar baz"), Component(0, 4), Component(7, 3) },
    184     { ASCIIToUTF16("link:foo.com"), Component(0, 4), kInvalidComponent },
    185     { ASCIIToUTF16("www.foo.com:81"), kInvalidComponent, Component(0, 11) },
    186     { WideToUTF16(L"\u6d4b\u8bd5"), kInvalidComponent, Component(0, 2) },
    187     { ASCIIToUTF16("view-source:http://www.foo.com/"), Component(12, 4),
    188         Component(19, 11) },
    189     { ASCIIToUTF16("view-source:https://example.com/"),
    190       Component(12, 5), Component(20, 11) },
    191     { ASCIIToUTF16("view-source:www.foo.com"), kInvalidComponent,
    192         Component(12, 11) },
    193     { ASCIIToUTF16("view-source:"), Component(0, 11), kInvalidComponent },
    194     { ASCIIToUTF16("view-source:garbage"), kInvalidComponent,
    195         Component(12, 7) },
    196     { ASCIIToUTF16("view-source:http://http://foo"), Component(12, 4),
    197         Component(19, 4) },
    198     { ASCIIToUTF16("view-source:view-source:http://example.com/"),
    199         Component(12, 11), kInvalidComponent }
    200   };
    201 
    202   for (size_t i = 0; i < ARRAYSIZE_UNSAFE(input_cases); ++i) {
    203     SCOPED_TRACE(input_cases[i].input);
    204     Component scheme, host;
    205     AutocompleteInput::ParseForEmphasizeComponents(input_cases[i].input,
    206                                                    &scheme,
    207                                                    &host);
    208     AutocompleteInput input(input_cases[i].input, string16::npos, string16(),
    209                             GURL(), AutocompleteInput::INVALID_SPEC, true,
    210                             false, true, AutocompleteInput::ALL_MATCHES);
    211     EXPECT_EQ(input_cases[i].scheme.begin, scheme.begin);
    212     EXPECT_EQ(input_cases[i].scheme.len, scheme.len);
    213     EXPECT_EQ(input_cases[i].host.begin, host.begin);
    214     EXPECT_EQ(input_cases[i].host.len, host.len);
    215   }
    216 }
    217 
    218 TEST(AutocompleteInputTest, InputTypeWithCursorPosition) {
    219   struct test_data {
    220     const string16 input;
    221     size_t cursor_position;
    222     const string16 normalized_input;
    223     size_t normalized_cursor_position;
    224   } input_cases[] = {
    225     { ASCIIToUTF16("foo bar"), string16::npos,
    226       ASCIIToUTF16("foo bar"), string16::npos },
    227 
    228     // regular case, no changes.
    229     { ASCIIToUTF16("foo bar"), 3, ASCIIToUTF16("foo bar"), 3 },
    230 
    231     // extra leading space.
    232     { ASCIIToUTF16("  foo bar"), 3, ASCIIToUTF16("foo bar"), 1 },
    233     { ASCIIToUTF16("      foo bar"), 3, ASCIIToUTF16("foo bar"), 0 },
    234     { ASCIIToUTF16("      foo bar   "), 2, ASCIIToUTF16("foo bar   "), 0 },
    235 
    236     // forced query.
    237     { ASCIIToUTF16("?foo bar"), 2, ASCIIToUTF16("foo bar"), 1 },
    238     { ASCIIToUTF16("  ?foo bar"), 4, ASCIIToUTF16("foo bar"), 1 },
    239     { ASCIIToUTF16("?  foo bar"), 4, ASCIIToUTF16("foo bar"), 1 },
    240     { ASCIIToUTF16("  ?  foo bar"), 6, ASCIIToUTF16("foo bar"), 1 },
    241   };
    242 
    243   for (size_t i = 0; i < ARRAYSIZE_UNSAFE(input_cases); ++i) {
    244     SCOPED_TRACE(input_cases[i].input);
    245     AutocompleteInput input(input_cases[i].input,
    246                             input_cases[i].cursor_position,
    247                             string16(), GURL(), AutocompleteInput::INVALID_SPEC,
    248                             true, false, true, AutocompleteInput::ALL_MATCHES);
    249     EXPECT_EQ(input_cases[i].normalized_input, input.text());
    250     EXPECT_EQ(input_cases[i].normalized_cursor_position,
    251               input.cursor_position());
    252   }
    253 }
    254