// Copyright (c) 2012 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
4
// This file declares an HttpTransactionFactory implementation that can be
// layered on top of another HttpTransactionFactory to add HTTP caching.  The
// caching logic follows RFC 2616 (any exceptions are called out in the code).
//
// The HttpCache obtains a disk_cache::Backend from the BackendFactory it is
// given at construction, and uses that backend for the cache storage.
//
// See HttpTransactionFactory and HttpTransaction for more details.
13
14#ifndef NET_HTTP_HTTP_CACHE_H_
15#define NET_HTTP_HTTP_CACHE_H_
16
17#include <list>
18#include <set>
19#include <string>
20
21#include "base/basictypes.h"
22#include "base/containers/hash_tables.h"
23#include "base/files/file_path.h"
24#include "base/memory/scoped_ptr.h"
25#include "base/memory/weak_ptr.h"
26#include "base/message_loop/message_loop_proxy.h"
27#include "base/threading/non_thread_safe.h"
28#include "base/time/time.h"
29#include "net/base/cache_type.h"
30#include "net/base/completion_callback.h"
31#include "net/base/load_states.h"
32#include "net/base/net_export.h"
33#include "net/base/request_priority.h"
34#include "net/http/http_network_session.h"
35#include "net/http/http_transaction_factory.h"
36
// Forward declarations of types declared outside the net namespace.
class GURL;

namespace disk_cache {
class Backend;
class Entry;
}  // namespace disk_cache
43
44namespace net {
45
// Forward declarations, kept in alphabetical order (classes first, then
// structs).
class CertVerifier;
class HostResolver;
class HttpAuthHandlerFactory;
class HttpNetworkSession;
class HttpResponseInfo;
class HttpServerProperties;
class IOBuffer;
class NetLog;
class NetworkDelegate;
class ProxyService;
class ServerBoundCertService;
class SSLConfigService;
class TransportSecurityState;
class ViewCacheHelper;
struct HttpRequestInfo;
61
62class NET_EXPORT HttpCache : public HttpTransactionFactory,
63                             public base::SupportsWeakPtr<HttpCache>,
64                             NON_EXPORTED_BASE(public base::NonThreadSafe) {
65 public:
66  // The cache mode of operation.
67  enum Mode {
68    // Normal mode just behaves like a standard web cache.
69    NORMAL = 0,
70    // Record mode caches everything for purposes of offline playback.
71    RECORD,
72    // Playback mode replays from a cache without considering any
73    // standard invalidations.
74    PLAYBACK,
75    // Disables reads and writes from the cache.
76    // Equivalent to setting LOAD_DISABLE_CACHE on every request.
77    DISABLE
78  };
79
80  // A BackendFactory creates a backend object to be used by the HttpCache.
81  class NET_EXPORT BackendFactory {
82   public:
83    virtual ~BackendFactory() {}
84
85    // The actual method to build the backend. Returns a net error code. If
86    // ERR_IO_PENDING is returned, the |callback| will be notified when the
87    // operation completes, and |backend| must remain valid until the
88    // notification arrives.
89    // The implementation must not access the factory object after invoking the
90    // |callback| because the object can be deleted from within the callback.
91    virtual int CreateBackend(NetLog* net_log,
92                              scoped_ptr<disk_cache::Backend>* backend,
93                              const CompletionCallback& callback) = 0;
94  };
95
96  // A default backend factory for the common use cases.
97  class NET_EXPORT DefaultBackend : public BackendFactory {
98   public:
99    // |path| is the destination for any files used by the backend, and
100    // |cache_thread| is the thread where disk operations should take place. If
101    // |max_bytes| is  zero, a default value will be calculated automatically.
102    DefaultBackend(CacheType type, BackendType backend_type,
103                   const base::FilePath& path, int max_bytes,
104                   base::MessageLoopProxy* thread);
105    virtual ~DefaultBackend();
106
107    // Returns a factory for an in-memory cache.
108    static BackendFactory* InMemory(int max_bytes);
109
110    // BackendFactory implementation.
111    virtual int CreateBackend(NetLog* net_log,
112                              scoped_ptr<disk_cache::Backend>* backend,
113                              const CompletionCallback& callback) OVERRIDE;
114
115   private:
116    CacheType type_;
117    BackendType backend_type_;
118    const base::FilePath path_;
119    int max_bytes_;
120    scoped_refptr<base::MessageLoopProxy> thread_;
121  };
122
123  // The disk cache is initialized lazily (by CreateTransaction) in this case.
124  // The HttpCache takes ownership of the |backend_factory|.
125  HttpCache(const net::HttpNetworkSession::Params& params,
126            BackendFactory* backend_factory);
127
128  // The disk cache is initialized lazily (by CreateTransaction) in  this case.
129  // Provide an existing HttpNetworkSession, the cache can construct a
130  // network layer with a shared HttpNetworkSession in order for multiple
131  // network layers to share information (e.g. authentication data). The
132  // HttpCache takes ownership of the |backend_factory|.
133  HttpCache(HttpNetworkSession* session, BackendFactory* backend_factory);
134
135  // Initialize the cache from its component parts, which is useful for
136  // testing.  The lifetime of the network_layer and backend_factory are managed
137  // by the HttpCache and will be destroyed using |delete| when the HttpCache is
138  // destroyed.
139  HttpCache(HttpTransactionFactory* network_layer,
140            NetLog* net_log,
141            BackendFactory* backend_factory);
142
143  virtual ~HttpCache();
144
145  HttpTransactionFactory* network_layer() { return network_layer_.get(); }
146
147  // Retrieves the cache backend for this HttpCache instance. If the backend
148  // is not initialized yet, this method will initialize it. The return value is
149  // a network error code, and it could be ERR_IO_PENDING, in which case the
150  // |callback| will be notified when the operation completes. The pointer that
151  // receives the |backend| must remain valid until the operation completes.
152  int GetBackend(disk_cache::Backend** backend,
153                 const net::CompletionCallback& callback);
154
155  // Returns the current backend (can be NULL).
156  disk_cache::Backend* GetCurrentBackend() const;
157
158  // Given a header data blob, convert it to a response info object.
159  static bool ParseResponseInfo(const char* data, int len,
160                                HttpResponseInfo* response_info,
161                                bool* response_truncated);
162
163  // Writes |buf_len| bytes of metadata stored in |buf| to the cache entry
164  // referenced by |url|, as long as the entry's |expected_response_time| has
165  // not changed. This method returns without blocking, and the operation will
166  // be performed asynchronously without any completion notification.
167  void WriteMetadata(const GURL& url,
168                     RequestPriority priority,
169                     base::Time expected_response_time,
170                     IOBuffer* buf,
171                     int buf_len);
172
173  // Get/Set the cache's mode.
174  void set_mode(Mode value) { mode_ = value; }
175  Mode mode() { return mode_; }
176
177  // Close currently active sockets so that fresh page loads will not use any
178  // recycled connections.  For sockets currently in use, they may not close
179  // immediately, but they will not be reusable. This is for debugging.
180  void CloseAllConnections();
181
182  // Close all idle connections. Will close all sockets not in active use.
183  void CloseIdleConnections();
184
185  // Called whenever an external cache in the system reuses the resource
186  // referred to by |url| and |http_method|.
187  void OnExternalCacheHit(const GURL& url, const std::string& http_method);
188
189  // Initializes the Infinite Cache, if selected by the field trial.
190  void InitializeInfiniteCache(const base::FilePath& path);
191
192  // HttpTransactionFactory implementation:
193  virtual int CreateTransaction(RequestPriority priority,
194                                scoped_ptr<HttpTransaction>* trans,
195                                HttpTransactionDelegate* delegate) OVERRIDE;
196  virtual HttpCache* GetCache() OVERRIDE;
197  virtual HttpNetworkSession* GetSession() OVERRIDE;
198
199 protected:
200  // Disk cache entry data indices.
201  enum {
202    kResponseInfoIndex = 0,
203    kResponseContentIndex,
204    kMetadataIndex,
205
206    // Must remain at the end of the enum.
207    kNumCacheEntryDataIndices
208  };
209  friend class ViewCacheHelper;
210
211 private:
212  // Types --------------------------------------------------------------------
213
214  class MetadataWriter;
215  class Transaction;
216  class WorkItem;
217  friend class Transaction;
218  struct PendingOp;  // Info for an entry under construction.
219
220  typedef std::list<Transaction*> TransactionList;
221  typedef std::list<WorkItem*> WorkItemList;
222
223  struct ActiveEntry {
224    explicit ActiveEntry(disk_cache::Entry* entry);
225    ~ActiveEntry();
226
227    disk_cache::Entry* disk_entry;
228    Transaction*       writer;
229    TransactionList    readers;
230    TransactionList    pending_queue;
231    bool               will_process_pending_queue;
232    bool               doomed;
233  };
234
235  typedef base::hash_map<std::string, ActiveEntry*> ActiveEntriesMap;
236  typedef base::hash_map<std::string, PendingOp*> PendingOpsMap;
237  typedef std::set<ActiveEntry*> ActiveEntriesSet;
238  typedef base::hash_map<std::string, int> PlaybackCacheMap;
239
240  // Methods ------------------------------------------------------------------
241
242  // Creates the |backend| object and notifies the |callback| when the operation
243  // completes. Returns an error code.
244  int CreateBackend(disk_cache::Backend** backend,
245                    const net::CompletionCallback& callback);
246
247  // Makes sure that the backend creation is complete before allowing the
248  // provided transaction to use the object. Returns an error code.  |trans|
249  // will be notified via its IO callback if this method returns ERR_IO_PENDING.
250  // The transaction is free to use the backend directly at any time after
251  // receiving the notification.
252  int GetBackendForTransaction(Transaction* trans);
253
254  // Generates the cache key for this request.
255  std::string GenerateCacheKey(const HttpRequestInfo*);
256
257  // Dooms the entry selected by |key|, if it is currently in the list of active
258  // entries.
259  void DoomActiveEntry(const std::string& key);
260
261  // Dooms the entry selected by |key|. |trans| will be notified via its IO
262  // callback if this method returns ERR_IO_PENDING. The entry can be
263  // currently in use or not.
264  int DoomEntry(const std::string& key, Transaction* trans);
265
266  // Dooms the entry selected by |key|. |trans| will be notified via its IO
267  // callback if this method returns ERR_IO_PENDING. The entry should not
268  // be currently in use.
269  int AsyncDoomEntry(const std::string& key, Transaction* trans);
270
271  // Dooms the entry associated with a GET for a given |url|.
272  void DoomMainEntryForUrl(const GURL& url);
273
274  // Closes a previously doomed entry.
275  void FinalizeDoomedEntry(ActiveEntry* entry);
276
277  // Returns an entry that is currently in use and not doomed, or NULL.
278  ActiveEntry* FindActiveEntry(const std::string& key);
279
280  // Creates a new ActiveEntry and starts tracking it. |disk_entry| is the disk
281  // cache entry.
282  ActiveEntry* ActivateEntry(disk_cache::Entry* disk_entry);
283
284  // Deletes an ActiveEntry.
285  void DeactivateEntry(ActiveEntry* entry);
286
287  // Deletes an ActiveEntry using an exhaustive search.
288  void SlowDeactivateEntry(ActiveEntry* entry);
289
290  // Returns the PendingOp for the desired |key|. If an entry is not under
291  // construction already, a new PendingOp structure is created.
292  PendingOp* GetPendingOp(const std::string& key);
293
294  // Deletes a PendingOp.
295  void DeletePendingOp(PendingOp* pending_op);
296
297  // Opens the disk cache entry associated with |key|, returning an ActiveEntry
298  // in |*entry|. |trans| will be notified via its IO callback if this method
299  // returns ERR_IO_PENDING.
300  int OpenEntry(const std::string& key, ActiveEntry** entry,
301                Transaction* trans);
302
303  // Creates the disk cache entry associated with |key|, returning an
304  // ActiveEntry in |*entry|. |trans| will be notified via its IO callback if
305  // this method returns ERR_IO_PENDING.
306  int CreateEntry(const std::string& key, ActiveEntry** entry,
307                  Transaction* trans);
308
309  // Destroys an ActiveEntry (active or doomed).
310  void DestroyEntry(ActiveEntry* entry);
311
312  // Adds a transaction to an ActiveEntry. If this method returns ERR_IO_PENDING
313  // the transaction will be notified about completion via its IO callback. This
314  // method returns ERR_CACHE_RACE to signal the transaction that it cannot be
315  // added to the provided entry, and it should retry the process with another
316  // one (in this case, the entry is no longer valid).
317  int AddTransactionToEntry(ActiveEntry* entry, Transaction* trans);
318
319  // Called when the transaction has finished working with this entry. |cancel|
320  // is true if the operation was cancelled by the caller instead of running
321  // to completion.
322  void DoneWithEntry(ActiveEntry* entry, Transaction* trans, bool cancel);
323
324  // Called when the transaction has finished writing to this entry. |success|
325  // is false if the cache entry should be deleted.
326  void DoneWritingToEntry(ActiveEntry* entry, bool success);
327
328  // Called when the transaction has finished reading from this entry.
329  void DoneReadingFromEntry(ActiveEntry* entry, Transaction* trans);
330
331  // Converts the active writer transaction to a reader so that other
332  // transactions can start reading from this entry.
333  void ConvertWriterToReader(ActiveEntry* entry);
334
335  // Returns the LoadState of the provided pending transaction.
336  LoadState GetLoadStateForPendingTransaction(const Transaction* trans);
337
338  // Removes the transaction |trans|, from the pending list of an entry
339  // (PendingOp, active or doomed entry).
340  void RemovePendingTransaction(Transaction* trans);
341
342  // Removes the transaction |trans|, from the pending list of |entry|.
343  bool RemovePendingTransactionFromEntry(ActiveEntry* entry,
344                                         Transaction* trans);
345
346  // Removes the transaction |trans|, from the pending list of |pending_op|.
347  bool RemovePendingTransactionFromPendingOp(PendingOp* pending_op,
348                                             Transaction* trans);
349
350  // Resumes processing the pending list of |entry|.
351  void ProcessPendingQueue(ActiveEntry* entry);
352
353  // Events (called via PostTask) ---------------------------------------------
354
355  void OnProcessPendingQueue(ActiveEntry* entry);
356
357  // Callbacks ----------------------------------------------------------------
358
359  // Processes BackendCallback notifications.
360  void OnIOComplete(int result, PendingOp* entry);
361
362  // Helper to conditionally delete |pending_op| if the HttpCache object it
363  // is meant for has been deleted.
364  //
365  // TODO(ajwong): The PendingOp lifetime management is very tricky.  It might
366  // be possible to simplify it using either base::Owned() or base::Passed()
367  // with the callback.
368  static void OnPendingOpComplete(const base::WeakPtr<HttpCache>& cache,
369                                  PendingOp* pending_op,
370                                  int result);
371
372  // Processes the backend creation notification.
373  void OnBackendCreated(int result, PendingOp* pending_op);
374
375  // Variables ----------------------------------------------------------------
376
377  NetLog* net_log_;
378
379  // Used when lazily constructing the disk_cache_.
380  scoped_ptr<BackendFactory> backend_factory_;
381  bool building_backend_;
382
383  Mode mode_;
384
385  const scoped_ptr<HttpTransactionFactory> network_layer_;
386  scoped_ptr<disk_cache::Backend> disk_cache_;
387
388  // The set of active entries indexed by cache key.
389  ActiveEntriesMap active_entries_;
390
391  // The set of doomed entries.
392  ActiveEntriesSet doomed_entries_;
393
394  // The set of entries "under construction".
395  PendingOpsMap pending_ops_;
396
397  scoped_ptr<PlaybackCacheMap> playback_cache_map_;
398
399  DISALLOW_COPY_AND_ASSIGN(HttpCache);
400};
401
402}  // namespace net
403
404#endif  // NET_HTTP_HTTP_CACHE_H_
405