Home | History | Annotate | Download | only in v3
      1 // Copyright (c) 2011 The Chromium Authors. All rights reserved.
      2 // Use of this source code is governed by a BSD-style license that can be
      3 // found in the LICENSE file.
      4 
      5 // The cache is stored on disk as a collection of block-files, plus an index
      6 // plus a collection of external files.
      7 //
      8 // Any data blob bigger than kMaxBlockSize (disk_cache/addr.h) will be stored in
      9 // a separate file named f_xxx where x is a hexadecimal number. Shorter data
     10 // will be stored as a series of blocks on a block-file. In any case, CacheAddr
     11 // represents the address of the data inside the cache.
     12 //
     13 // The index is actually a collection of four files that store a hash table with
     14 // allocation bitmaps and backup data. Hash collisions are handled directly by
     15 // the table, which from some point of view behaves like a 4-way associative
     16 // cache with overflow buckets (so not really open addressing).
     17 //
     18 // Basically the hash table is a collection of buckets. The first part of the
     19 // table has a fixed number of buckets and it is directly addressed by the hash,
     20 // while the second part of the table (stored on a second file) has a variable
     21 // number of buckets. Each bucket stores up to four cells (each cell represents
     22 // a possibl entry). The index bitmap tracks the state of individual cells.
     23 //
     24 // The last element of the cache is the block-file. A block file is a file
     25 // designed to store blocks of data of a given size. For more details see
     26 // disk_cache/disk_format_base.h
     27 //
     28 // A new cache is initialized with a set of block files (named data_0 through
     29 // data_6), each one dedicated to store blocks of a given size or function. The
     30 // number at the end of the file name is the block file number (in decimal).
     31 //
     32 // There are three "special" types of blocks: normal entries, evicted entries
     33 // and control data for external files.
     34 //
     35 // The files that store internal information for the cache (blocks and index)
     36 // are memory mapped. They have a location that is signaled every time the
     37 // internal structures are modified, so it is possible to detect (most of the
     38 // time) when the process dies in the middle of an update. There are dedicated
     39 // backup files for cache bitmaps, used to detect entries out of date.
     40 
     41 #ifndef NET_DISK_CACHE_V3_DISK_FORMAT_V3_H_
     42 #define NET_DISK_CACHE_V3_DISK_FORMAT_V3_H_
     43 
     44 #include "base/basictypes.h"
     45 #include "net/disk_cache/disk_format_base.h"
     46 
     47 namespace disk_cache {
     48 
     49 const int kBaseTableLen = 0x10000;
     50 const uint32 kIndexMagicV3 = 0xC103CAC3;
     51 const uint32 kVersion3 = 0x30000;  // Version 3.0.
     52 
     53 // Flags for a given cache.
     54 enum CacheFlags {
     55   CACHE_EVICTION_2 = 1,      // Keep multiple lists for eviction.
     56   CACHE_EVICTED = 1 << 1     // Already evicted at least one entry.
     57 };
     58 
     59 // Header for the master index file.
     60 struct IndexHeaderV3 {
     61   uint32      magic;
     62   uint32      version;
     63   int32       num_entries;   // Number of entries currently stored.
     64   int32       num_bytes;     // Total size of the stored data.
     65   int32       last_file;     // Last external file created.
     66   int32       reserved1;
     67   CacheAddr   stats;         // Storage for usage data.
     68   int32       table_len;     // Actual size of the table.
     69   int32       crash;         // Signals a previous crash.
     70   int32       experiment;    // Id of an ongoing test.
     71   int32       max_bytes;     // Total maximum size of the stored data.
     72   uint32      flags;
     73   int32       used_cells;
     74   int32       max_bucket;
     75   uint64      create_time;   // Creation time for this set of files.
     76   uint64      base_time;     // Current base for timestamps.
     77   uint64      old_time;      // Previous time used for timestamps.
     78   int32       max_block_file;
     79   int32       num_no_use_entries;
     80   int32       num_low_use_entries;
     81   int32       num_high_use_entries;
     82   int32       reserved;
     83   int32       num_evicted_entries;
     84   int32       pad[6];
     85 };
     86 
     87 const int kBaseBitmapBytes = 3968;
     88 // The IndexBitmap is directly saved to a file named index. The file grows in
     89 // page increments (4096 bytes), but all bits don't have to be in use at any
     90 // given time. The required file size can be computed from header.table_len.
     91 struct IndexBitmap {
     92   IndexHeaderV3   header;
     93   uint32          bitmap[kBaseBitmapBytes / 4];  // First page of the bitmap.
     94 };
     95 COMPILE_ASSERT(sizeof(IndexBitmap) == 4096, bad_IndexHeader);
     96 
     97 // Possible states for a given entry.
     98 enum EntryState {
     99   ENTRY_FREE = 0,   // Available slot.
    100   ENTRY_NEW,        // The entry is being created.
    101   ENTRY_OPEN,       // The entry is being accessed.
    102   ENTRY_MODIFIED,   // The entry is being modified.
    103   ENTRY_DELETED,    // The entry is being deleted.
    104   ENTRY_FIXING,     // Inconsistent state. The entry is being verified.
    105   ENTRY_USED        // The slot is in use (entry is present).
    106 };
    107 COMPILE_ASSERT(ENTRY_USED <= 7, state_uses_3_bits);
    108 
    109 enum EntryGroup {
    110   ENTRY_NO_USE = 0,   // The entry has not been reused.
    111   ENTRY_LOW_USE,      // The entry has low reuse.
    112   ENTRY_HIGH_USE,     // The entry has high reuse.
    113   ENTRY_RESERVED,     // Reserved for future use.
    114   ENTRY_EVICTED       // The entry was deleted.
    115 };
    116 COMPILE_ASSERT(ENTRY_USED <= 7, group_uses_3_bits);
    117 
    118 #pragma pack(push, 1)
    119 struct IndexCell {
    120   void Clear() { memset(this, 0, sizeof(*this)); }
    121 
    122   uint64      address : 22;
    123   uint64      hash : 18;
    124   uint64      timestamp : 20;
    125   uint64      reuse : 4;
    126   uint8       state : 3;
    127   uint8       group : 3;
    128   uint8       sum : 2;
    129 };
    130 COMPILE_ASSERT(sizeof(IndexCell) == 9, bad_IndexCell);
    131 
    132 struct IndexBucket {
    133   IndexCell   cells[4];
    134   int32       next;
    135   uint32      hash : 24;      // The last byte is only defined for buckets of
    136   uint32      reserved : 8;   // the extra table.
    137 };
    138 COMPILE_ASSERT(sizeof(IndexBucket) == 44, bad_IndexBucket);
    139 const int kBytesPerCell = 44 / 4;
    140 
    141 // The main cache index. Backed by a file named index_tb1.
    142 // The extra table (index_tb2) has a similar format, but different size.
    143 struct Index {
    144   // Default size. Actual size controlled by header.table_len.
    145   IndexBucket table[kBaseTableLen / 4];
    146 };
    147 #pragma pack(pop)
    148 
    149 // Flags that can be applied to an entry.
    150 enum EntryFlags {
    151   PARENT_ENTRY = 1,         // This entry has children (sparse) entries.
    152   CHILD_ENTRY = 1 << 1      // Child entry that stores sparse data.
    153 };
    154 
    155 struct EntryRecord {
    156   uint32      hash;
    157   uint32      pad1;
    158   uint8       reuse_count;
    159   uint8       refetch_count;
    160   int8        state;              // Current EntryState.
    161   uint8       flags;              // Any combination of EntryFlags.
    162   int32       key_len;
    163   int32       data_size[4];       // We can store up to 4 data streams for each
    164   CacheAddr   data_addr[4];       // entry.
    165   uint32      data_hash[4];
    166   uint64      creation_time;
    167   uint64      last_modified_time;
    168   uint64      last_access_time;
    169   int32       pad[3];
    170   uint32      self_hash;
    171 };
    172 COMPILE_ASSERT(sizeof(EntryRecord) == 104, bad_EntryRecord);
    173 
    174 struct ShortEntryRecord {
    175   uint32      hash;
    176   uint32      pad1;
    177   uint8       reuse_count;
    178   uint8       refetch_count;
    179   int8        state;              // Current EntryState.
    180   uint8       flags;
    181   int32       key_len;
    182   uint64      last_access_time;
    183   uint32      long_hash[5];
    184   uint32      self_hash;
    185 };
    186 COMPILE_ASSERT(sizeof(ShortEntryRecord) == 48, bad_ShortEntryRecord);
    187 
    188 }  // namespace disk_cache
    189 
    190 #endif  // NET_DISK_CACHE_V3_DISK_FORMAT_V3_H_
    191