Home | History | Annotate | Download | only in http
      1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
      2 // Use of this source code is governed by a BSD-style license that can be
      3 // found in the LICENSE file.
      4 
       5 // This file declares an HttpTransactionFactory implementation that can be
      6 // layered on top of another HttpTransactionFactory to add HTTP caching.  The
      7 // caching logic follows RFC 2616 (any exceptions are called out in the code).
      8 //
      9 // The HttpCache takes a disk_cache::Backend as a parameter, and uses that for
     10 // the cache storage.
     11 //
     12 // See HttpTransactionFactory and HttpTransaction for more details.
     13 
     14 #ifndef NET_HTTP_HTTP_CACHE_H_
     15 #define NET_HTTP_HTTP_CACHE_H_
     16 
     17 #include <list>
     18 #include <set>
     19 #include <string>
     20 
     21 #include "base/basictypes.h"
     22 #include "base/containers/hash_tables.h"
     23 #include "base/files/file_path.h"
     24 #include "base/memory/scoped_ptr.h"
     25 #include "base/memory/weak_ptr.h"
     26 #include "base/message_loop/message_loop_proxy.h"
     27 #include "base/threading/non_thread_safe.h"
     28 #include "base/time/time.h"
     29 #include "net/base/cache_type.h"
     30 #include "net/base/completion_callback.h"
     31 #include "net/base/load_states.h"
     32 #include "net/base/net_export.h"
     33 #include "net/base/request_priority.h"
     34 #include "net/http/http_network_session.h"
     35 #include "net/http/http_transaction_factory.h"
     36 
      37 class GURL;  // Forward declaration; only used as |const GURL&| in this header.
      38 
      39 namespace disk_cache {
        // Forward declarations; this header only refers to these types through
        // pointers and scoped_ptr, so their definitions are not needed here.
      40 class Backend;
      41 class Entry;
      42 }  // namespace disk_cache
     43 
     44 namespace net {
     45 
      46 class CertVerifier;  // NOTE(review): not referenced again in this header.
      47 class HostResolver;  // NOTE(review): not referenced again in this header.
      48 class HttpAuthHandlerFactory;  // NOTE(review): not referenced again here.
        // NOTE(review): net/http/http_network_session.h is already included by this
        // header (HttpNetworkSession::Params is used by a constructor below), so
        // this forward declaration looks redundant.
      49 class HttpNetworkSession;
      50 class HttpResponseInfo;
      51 class HttpServerProperties;  // NOTE(review): not referenced again here.
      52 class IOBuffer;
      53 class NetLog;
      54 class NetworkDelegate;  // NOTE(review): not referenced again in this header.
      55 class ServerBoundCertService;  // NOTE(review): not referenced again here.
      56 class ProxyService;  // NOTE(review): not referenced again in this header.
      57 class SSLConfigService;  // NOTE(review): not referenced again in this header.
      58 class TransportSecurityState;  // NOTE(review): not referenced again here.
      59 class ViewCacheHelper;  // Declared a friend of HttpCache below.
      60 struct HttpRequestInfo;
     61 
      62 class NET_EXPORT HttpCache : public HttpTransactionFactory,
      63                              public base::SupportsWeakPtr<HttpCache>,
      64                              NON_EXPORTED_BASE(public base::NonThreadSafe) {
        // HttpCache is itself an HttpTransactionFactory (see CreateTransaction()
        // below). It holds another HttpTransactionFactory in |network_layer_| and
        // a lazily created disk_cache::Backend in |disk_cache_|.
        // NOTE(review): it derives from base::NonThreadSafe, so presumably all use
        // must stay on a single thread -- confirm against
        // base/threading/non_thread_safe.h.
      65  public:
      66   // The cache mode of operation.
      67   enum Mode {
      68     // Normal mode just behaves like a standard web cache.
      69     NORMAL = 0,
      70     // Record mode caches everything for purposes of offline playback.
      71     RECORD,
      72     // Playback mode replays from a cache without considering any
      73     // standard invalidations.
      74     PLAYBACK,
      75     // Disables reads and writes from the cache.
      76     // Equivalent to setting LOAD_DISABLE_CACHE on every request.
      77     DISABLE
      78   };
      79 
      80   // A BackendFactory creates a backend object to be used by the HttpCache.
      81   class NET_EXPORT BackendFactory {
      82    public:
      83     virtual ~BackendFactory() {}
      84 
      85     // The actual method to build the backend. Returns a net error code. If
      86     // ERR_IO_PENDING is returned, the |callback| will be notified when the
      87     // operation completes, and |backend| must remain valid until the
      88     // notification arrives.
      89     // The implementation must not access the factory object after invoking the
      90     // |callback| because the object can be deleted from within the callback.
      91     virtual int CreateBackend(NetLog* net_log,
      92                               scoped_ptr<disk_cache::Backend>* backend,
      93                               const CompletionCallback& callback) = 0;
      94   };
      95 
      96   // A default backend factory for the common use cases.
      97   class NET_EXPORT DefaultBackend : public BackendFactory {
      98    public:
      99     // |path| is the destination for any files used by the backend, and
     100     // |thread| is the thread where disk operations should take place. If
     101     // |max_bytes| is zero, a default value will be calculated automatically.
     102     DefaultBackend(CacheType type, BackendType backend_type,
     103                    const base::FilePath& path, int max_bytes,
     104                    base::MessageLoopProxy* thread);
     105     virtual ~DefaultBackend();
     106 
     107     // Returns a factory for an in-memory cache.
          // NOTE(review): returns a raw pointer; presumably the caller takes
          // ownership (the HttpCache constructors below take ownership of the
          // factory they are given) -- confirm in http_cache.cc.
     108     static BackendFactory* InMemory(int max_bytes);
     109 
     110     // BackendFactory implementation.
     111     virtual int CreateBackend(NetLog* net_log,
     112                               scoped_ptr<disk_cache::Backend>* backend,
     113                               const CompletionCallback& callback) OVERRIDE;
     114 
     115    private:
          // One member per constructor argument; |thread_| keeps a reference to the
          // MessageLoopProxy through scoped_refptr.
     116     CacheType type_;
     117     BackendType backend_type_;
     118     const base::FilePath path_;
     119     int max_bytes_;
     120     scoped_refptr<base::MessageLoopProxy> thread_;
     121   };
     122 
     123   // The disk cache is initialized lazily (by CreateTransaction) in this case.
     124   // The HttpCache takes ownership of the |backend_factory|.
     125   HttpCache(const net::HttpNetworkSession::Params& params,
     126             BackendFactory* backend_factory);
     127 
     128   // The disk cache is initialized lazily (by CreateTransaction) in this case.
     129   // Given an existing HttpNetworkSession, the cache can construct a
     130   // network layer with a shared HttpNetworkSession in order for multiple
     131   // network layers to share information (e.g. authentication data). The
     132   // HttpCache takes ownership of the |backend_factory|.
     133   HttpCache(HttpNetworkSession* session, BackendFactory* backend_factory);
     134 
     135   // Initialize the cache from its component parts, which is useful for
     136   // testing.  The lifetimes of |network_layer| and |backend_factory| are
     137   // managed by the HttpCache; both will be destroyed using |delete| when the
     138   // HttpCache is destroyed.
     139   HttpCache(HttpTransactionFactory* network_layer,
     140             NetLog* net_log,
     141             BackendFactory* backend_factory);
     142 
     143   virtual ~HttpCache();
     144 
        // Returns the network layer factory. The returned pointer remains owned by
        // this object (|network_layer_| is a scoped_ptr).
     145   HttpTransactionFactory* network_layer() { return network_layer_.get(); }
     146 
     147   // Retrieves the cache backend for this HttpCache instance. If the backend
     148   // is not initialized yet, this method will initialize it. The return value is
     149   // a network error code, and it could be ERR_IO_PENDING, in which case the
     150   // |callback| will be notified when the operation completes. The pointer that
     151   // receives the |backend| must remain valid until the operation completes.
     152   int GetBackend(disk_cache::Backend** backend,
     153                  const net::CompletionCallback& callback);
     154 
     155   // Returns the current backend (can be NULL).
     156   disk_cache::Backend* GetCurrentBackend() const;
     157 
     158   // Given a header data blob, convert it to a response info object.
     159   static bool ParseResponseInfo(const char* data, int len,
     160                                 HttpResponseInfo* response_info,
     161                                 bool* response_truncated);
     162 
     163   // Writes |buf_len| bytes of metadata stored in |buf| to the cache entry
     164   // referenced by |url|, as long as the entry's |expected_response_time| has
     165   // not changed. This method returns without blocking, and the operation will
     166   // be performed asynchronously without any completion notification.
     167   void WriteMetadata(const GURL& url,
     168                      RequestPriority priority,
     169                      base::Time expected_response_time,
     170                      IOBuffer* buf,
     171                      int buf_len);
     172 
     173   // Get/Set the cache's mode (one of the Mode values above).
        // NOTE(review): mode() is not declared const, so it cannot be called
        // through a const HttpCache reference or pointer.
     174   void set_mode(Mode value) { mode_ = value; }
     175   Mode mode() { return mode_; }
     176 
     177   // Close currently active sockets so that fresh page loads will not use any
     178   // recycled connections.  For sockets currently in use, they may not close
     179   // immediately, but they will not be reusable. This is for debugging.
     180   void CloseAllConnections();
     181 
     182   // Close all idle connections. Will close all sockets not in active use.
     183   void CloseIdleConnections();
     184 
     185   // Called whenever an external cache in the system reuses the resource
     186   // referred to by |url| and |http_method|.
     187   void OnExternalCacheHit(const GURL& url, const std::string& http_method);
     188 
     189   // Initializes the Infinite Cache, if selected by the field trial.
     190   void InitializeInfiniteCache(const base::FilePath& path);
     191 
     192   // HttpTransactionFactory implementation:
     193   virtual int CreateTransaction(RequestPriority priority,
     194                                 scoped_ptr<HttpTransaction>* trans,
     195                                 HttpTransactionDelegate* delegate) OVERRIDE;
     196   virtual HttpCache* GetCache() OVERRIDE;
     197   virtual HttpNetworkSession* GetSession() OVERRIDE;
     198 
     199  protected:
     200   // Disk cache entry data indices.
     201   enum {
     202     kResponseInfoIndex = 0,
     203     kResponseContentIndex,
     204     kMetadataIndex,
     205 
     206     // Must remain at the end of the enum.
     207     kNumCacheEntryDataIndices
     208   };
        // Friendship gives ViewCacheHelper access to the protected indices above
        // as well as to the private members below.
     209   friend class ViewCacheHelper;
     210 
     211  private:
     212   // Types --------------------------------------------------------------------
     213 
        // These nested types are only declared here; their definitions are not part
        // of this header.
     214   class MetadataWriter;
     215   class Transaction;
     216   class WorkItem;
        // Grants Transaction access to the private methods of HttpCache declared
        // below.
     217   friend class Transaction;
     218   struct PendingOp;  // Info for an entry under construction.
     219 
     220   typedef std::list<Transaction*> TransactionList;
     221   typedef std::list<WorkItem*> WorkItemList;
     222 
        // Bookkeeping for one disk cache entry: the |disk_entry| pointer, a single
        // |writer| transaction pointer, a list of |readers| and a list of
        // transactions in |pending_queue|.
        // NOTE(review): |will_process_pending_queue| presumably marks that an
        // OnProcessPendingQueue() task is outstanding, and |doomed| presumably
        // mirrors membership in |doomed_entries_| -- confirm in http_cache.cc.
     223   struct ActiveEntry {
     224     explicit ActiveEntry(disk_cache::Entry* entry);
     225     ~ActiveEntry();
     226 
     227     disk_cache::Entry* disk_entry;
     228     Transaction*       writer;
     229     TransactionList    readers;
     230     TransactionList    pending_queue;
     231     bool               will_process_pending_queue;
     232     bool               doomed;
     233   };
     234 
        // Container types for the member variables at the end of the class. The
        // maps are keyed by std::string and store raw pointers.
        // NOTE(review): the int value of PlaybackCacheMap is not documented in this
        // header -- confirm its meaning in http_cache.cc.
     235   typedef base::hash_map<std::string, ActiveEntry*> ActiveEntriesMap;
     236   typedef base::hash_map<std::string, PendingOp*> PendingOpsMap;
     237   typedef std::set<ActiveEntry*> ActiveEntriesSet;
     238   typedef base::hash_map<std::string, int> PlaybackCacheMap;
     239 
     240   // Methods ------------------------------------------------------------------
     241 
     242   // Creates the |backend| object and notifies the |callback| when the operation
     243   // completes. Returns an error code.
     244   int CreateBackend(disk_cache::Backend** backend,
     245                     const net::CompletionCallback& callback);
     246 
     247   // Makes sure that the backend creation is complete before allowing the
     248   // provided transaction to use the object. Returns an error code.  |trans|
     249   // will be notified via its IO callback if this method returns ERR_IO_PENDING.
     250   // The transaction is free to use the backend directly at any time after
     251   // receiving the notification.
     252   int GetBackendForTransaction(Transaction* trans);
     253 
     254   // Generates the cache key for this request.
     255   std::string GenerateCacheKey(const HttpRequestInfo*);
     256 
     257   // Dooms the entry selected by |key|, if it is currently in the list of active
     258   // entries.
     259   void DoomActiveEntry(const std::string& key);
     260 
     261   // Dooms the entry selected by |key|. |trans| will be notified via its IO
     262   // callback if this method returns ERR_IO_PENDING. The entry can be
     263   // currently in use or not.
     264   int DoomEntry(const std::string& key, Transaction* trans);
     265 
     266   // Dooms the entry selected by |key|. |trans| will be notified via its IO
     267   // callback if this method returns ERR_IO_PENDING. The entry should not
     268   // be currently in use.
     269   int AsyncDoomEntry(const std::string& key, Transaction* trans);
     270 
     271   // Dooms the entry associated with a GET for a given |url|.
     272   void DoomMainEntryForUrl(const GURL& url);
     273 
     274   // Closes a previously doomed entry.
     275   void FinalizeDoomedEntry(ActiveEntry* entry);
     276 
     277   // Returns an entry that is currently in use and not doomed, or NULL.
     278   ActiveEntry* FindActiveEntry(const std::string& key);
     279 
     280   // Creates a new ActiveEntry and starts tracking it. |disk_entry| is the disk
     281   // cache entry.
     282   ActiveEntry* ActivateEntry(disk_cache::Entry* disk_entry);
     283 
     284   // Deletes an ActiveEntry.
     285   void DeactivateEntry(ActiveEntry* entry);
     286 
     287   // Deletes an ActiveEntry using an exhaustive search.
     288   void SlowDeactivateEntry(ActiveEntry* entry);
     289 
     290   // Returns the PendingOp for the desired |key|. If an entry is not under
     291   // construction already, a new PendingOp structure is created.
     292   PendingOp* GetPendingOp(const std::string& key);
     293 
     294   // Deletes a PendingOp.
     295   void DeletePendingOp(PendingOp* pending_op);
     296 
     297   // Opens the disk cache entry associated with |key|, returning an ActiveEntry
     298   // in |*entry|. |trans| will be notified via its IO callback if this method
     299   // returns ERR_IO_PENDING.
     300   int OpenEntry(const std::string& key, ActiveEntry** entry,
     301                 Transaction* trans);
     302 
     303   // Creates the disk cache entry associated with |key|, returning an
     304   // ActiveEntry in |*entry|. |trans| will be notified via its IO callback if
     305   // this method returns ERR_IO_PENDING.
     306   int CreateEntry(const std::string& key, ActiveEntry** entry,
     307                   Transaction* trans);
     308 
     309   // Destroys an ActiveEntry (active or doomed).
     310   void DestroyEntry(ActiveEntry* entry);
     311 
     312   // Adds a transaction to an ActiveEntry. If this method returns ERR_IO_PENDING
     313   // the transaction will be notified about completion via its IO callback. This
     314   // method returns ERR_CACHE_RACE to signal the transaction that it cannot be
     315   // added to the provided entry, and it should retry the process with another
     316   // one (in this case, the entry is no longer valid).
     317   int AddTransactionToEntry(ActiveEntry* entry, Transaction* trans);
     318 
     319   // Called when the transaction has finished working with this entry. |cancel|
     320   // is true if the operation was cancelled by the caller instead of running
     321   // to completion.
     322   void DoneWithEntry(ActiveEntry* entry, Transaction* trans, bool cancel);
     323 
     324   // Called when the transaction has finished writing to this entry. |success|
     325   // is false if the cache entry should be deleted.
     326   void DoneWritingToEntry(ActiveEntry* entry, bool success);
     327 
     328   // Called when the transaction has finished reading from this entry.
     329   void DoneReadingFromEntry(ActiveEntry* entry, Transaction* trans);
     330 
     331   // Converts the active writer transaction to a reader so that other
     332   // transactions can start reading from this entry.
     333   void ConvertWriterToReader(ActiveEntry* entry);
     334 
     335   // Returns the LoadState of the provided pending transaction.
     336   LoadState GetLoadStateForPendingTransaction(const Transaction* trans);
     337 
     338   // Removes the transaction |trans| from the pending list of an entry
     339   // (PendingOp, active or doomed entry).
     340   void RemovePendingTransaction(Transaction* trans);
     341 
     342   // Removes the transaction |trans| from the pending list of |entry|.
        // NOTE(review): the meaning of the bool result is not documented here;
        // presumably true when |trans| was found and removed -- confirm.
     343   bool RemovePendingTransactionFromEntry(ActiveEntry* entry,
     344                                          Transaction* trans);
     345 
     346   // Removes the transaction |trans| from the pending list of |pending_op|.
        // NOTE(review): bool result undocumented, as for the method above.
     347   bool RemovePendingTransactionFromPendingOp(PendingOp* pending_op,
     348                                              Transaction* trans);
     349 
     350   // Resumes processing the pending list of |entry|.
     351   void ProcessPendingQueue(ActiveEntry* entry);
     352 
     353   // Events (called via PostTask) ---------------------------------------------
     354 
     355   void OnProcessPendingQueue(ActiveEntry* entry);
     356 
     357   // Callbacks ----------------------------------------------------------------
     358 
     359   // Processes BackendCallback notifications.
        // Note that the second parameter is a PendingOp even though it is named
        // |entry|.
     360   void OnIOComplete(int result, PendingOp* entry);
     361 
     362   // Helper to conditionally delete |pending_op| if the HttpCache object it
     363   // is meant for has been deleted.
     364   //
     365   // TODO(ajwong): The PendingOp lifetime management is very tricky.  It might
     366   // be possible to simplify it using either base::Owned() or base::Passed()
     367   // with the callback.
     368   static void OnPendingOpComplete(const base::WeakPtr<HttpCache>& cache,
     369                                   PendingOp* pending_op,
     370                                   int result);
     371 
     372   // Processes the backend creation notification.
     373   void OnBackendCreated(int result, PendingOp* pending_op);
     374 
     375   // Variables ----------------------------------------------------------------
     376 
        // NOTE(review): held as a raw pointer, unlike the scoped_ptr members below;
        // presumably not owned by the HttpCache -- confirm in http_cache.cc.
     377   NetLog* net_log_;
     378 
     379   // Used when lazily constructing the disk_cache_.
     380   scoped_ptr<BackendFactory> backend_factory_;
     381   bool building_backend_;
     382 
        // Current mode of operation; read and written by mode() / set_mode().
     383   Mode mode_;
     384 
        // The scoped_ptr for the network layer is const, so it cannot be reset or
        // reassigned after construction. |disk_cache_| is the backend handed out by
        // GetCurrentBackend() -- NOTE(review): confirm in http_cache.cc.
     385   const scoped_ptr<HttpTransactionFactory> network_layer_;
     386   scoped_ptr<disk_cache::Backend> disk_cache_;
     387 
     388   // The set of active entries indexed by cache key.
     389   ActiveEntriesMap active_entries_;
     390 
     391   // The set of doomed entries.
     392   ActiveEntriesSet doomed_entries_;
     393 
     394   // The set of entries "under construction".
     395   PendingOpsMap pending_ops_;
     396 
        // NOTE(review): purpose not documented in this header; presumably related
        // to the RECORD / PLAYBACK modes -- confirm in http_cache.cc.
     397   scoped_ptr<PlaybackCacheMap> playback_cache_map_;
     398 
     399   DISALLOW_COPY_AND_ASSIGN(HttpCache);
     400 };
    401 
    402 }  // namespace net
    403 
    404 #endif  // NET_HTTP_HTTP_CACHE_H_
    405