Home | History | Annotate | Download | only in url_fixer
      1 // Copyright (c) 2011 The Chromium Authors. All rights reserved.
      2 // Use of this source code is governed by a BSD-style license that can be
      3 // found in the LICENSE file.
      4 
      5 #ifndef COMPONENTS_URL_FIXER_URL_FIXER_H_
      6 #define COMPONENTS_URL_FIXER_URL_FIXER_H_
      7 
      8 #include <string>
      9 
     10 #include "base/strings/string16.h"
     11 #include "url/gurl.h"
     12 
     13 namespace base {
     14 class FilePath;
     15 }  // namespace base
     16 
     17 namespace url {
     18 struct Component;
     19 struct Parsed;
     20 }  // namespace url
     21 
     22 // The functions in this namespace are designed to convert various types of
     23 // input (for example, user typing in the URL bar, or command line options)
     24 // into URLs that we know are valid. This is NOT the place for converting
     25 // between different types of URLs or parsing them; see net_util.h for that.
     26 namespace url_fixer {
     27 
     28   // Segments the given text string into parts of a URL.  This is most useful
     29   // for schemes such as http, https, and ftp where |SegmentURL| will find many
     30   // segments.  Currently does not segment "file" schemes.
     31   // Returns the canonicalized scheme, or the empty string when |text| is only
     32   // whitespace.
     33 std::string SegmentURL(const std::string& text, url::Parsed* parts);
     34 base::string16 SegmentURL(const base::string16& text, url::Parsed* parts);
     35 
     36   // Converts |text| to a fixed-up URL and returns it. Attempts to make
     37   // some "smart" adjustments to obviously-invalid input where possible.
     38   // |text| may be an absolute path to a file, which will get converted to a
     39   // "file:" URL.
     40   //
     41   // The result will be a "more" valid URL than the input. It may still not
     42   // be valid, so check the return value's validity or use
     43   // possibly_invalid_spec().
     44   //
     45   // Schemes "about" and "chrome" are normalized to "chrome://", with slashes.
     46   // "about:blank" is unaltered, as WebKit allows frames to access about:blank.
     47   // Additionally, if a chrome URL does not have a valid host, as in "about:",
     48   // the returned URL will have the host "version", as in "chrome://version".
     49   //
     50   // If |desired_tld| is non-empty, it represents the TLD the user wishes to
     51   // append in the case of an incomplete domain.  We check that this is not a
     52   // file path and there does not appear to be a valid TLD already, then append
     53   // |desired_tld| to the domain and prepend "www." (unless it, or a scheme,
     54   // is already present).  This TLD should not have a leading '.' (use "com"
     55   // instead of ".com").
     56   GURL FixupURL(const std::string& text, const std::string& desired_tld);
     57 
     58   // Converts |text| to a fixed-up URL, allowing it to be a relative path on
     59   // the local filesystem.  Begin searching in |base_dir|; if empty, use the
     60   // current working directory.  If this resolves to a file on disk, return
     61   // it as a "file:" URL; otherwise, fall back to the behavior of
     62   // FixupURL().
     63   //
     64   // For "regular" input, even if it is possibly a file with a full path, you
     65   // should use FixupURL() directly.  This function should only be used when
     66   // relative path handling is desired, as for command line processing.
     67   GURL FixupRelativeFile(const base::FilePath& base_dir,
     68                          const base::FilePath& text);
     69 
     70   // Offsets the beginning index of |part| by |offset|, which is allowed to be
     71   // negative.  In some cases, the desired component does not exist at the given
     72   // offset.  For example, when converting from "http://foo" to "foo", the
     73   // scheme component no longer exists.  In such a case, the beginning index is
     74   // set to 0.
     75   // Does nothing if |part| is invalid.
     76   void OffsetComponent(int offset, url::Component* part);
     77 
     78   // For paths like ~, we use $HOME for the current user's home
     79   // directory.  For tests, we allow our idea of $HOME to be overridden
     80   // by this variable.
     81   extern const char* home_directory_override;
     82 
     83 }  // namespace url_fixer
     84 
     85 #endif  // COMPONENTS_URL_FIXER_URL_FIXER_H_
     86