Home | History | Annotate | Download | only in db
      1 // Copyright (c) 2011 The LevelDB Authors. All rights reserved.
      2 // Use of this source code is governed by a BSD-style license that can be
      3 // found in the LICENSE file. See the AUTHORS file for names of contributors.
      4 
      5 #ifndef STORAGE_LEVELDB_DB_FORMAT_H_
      6 #define STORAGE_LEVELDB_DB_FORMAT_H_
      7 
      8 #include <stdio.h>
      9 #include "leveldb/comparator.h"
     10 #include "leveldb/db.h"
     11 #include "leveldb/filter_policy.h"
     12 #include "leveldb/slice.h"
     13 #include "leveldb/table_builder.h"
     14 #include "util/coding.h"
     15 #include "util/logging.h"
     16 
     17 namespace leveldb {
     18 
     19 // Grouping of constants.  We may want to make some of these
     20 // parameters set via options.
     21 namespace config {
     22 static const int kNumLevels = 7;
     23 
     24 // Level-0 compaction is started when we hit this many files.
     25 static const int kL0_CompactionTrigger = 4;
     26 
     27 // Soft limit on number of level-0 files.  We slow down writes at this point.
     28 static const int kL0_SlowdownWritesTrigger = 8;
     29 
     30 // Maximum number of level-0 files.  We stop writes at this point.
     31 static const int kL0_StopWritesTrigger = 12;
     32 
     33 // Maximum level to which a new compacted memtable is pushed if it
     34 // does not create overlap.  We try to push to level 2 to avoid the
     35 // relatively expensive level 0=>1 compactions and to avoid some
     36 // expensive manifest file operations.  We do not push all the way to
     37 // the largest level since that can generate a lot of wasted disk
     38 // space if the same key space is being repeatedly overwritten.
     39 static const int kMaxMemCompactLevel = 2;
     40 
     41 // Approximate gap in bytes between samples of data read during iteration.
     42 static const int kReadBytesPeriod = 1048576;
     43 
     44 }  // namespace config
     45 
     46 class InternalKey;
     47 
     48 // Value types encoded as the last component of internal keys.
     49 // DO NOT CHANGE THESE ENUM VALUES: they are embedded in the on-disk
     50 // data structures.
     51 enum ValueType {
     52   kTypeDeletion = 0x0,
     53   kTypeValue = 0x1
     54 };
     55 // kValueTypeForSeek defines the ValueType that should be passed when
     56 // constructing a ParsedInternalKey object for seeking to a particular
     57 // sequence number (since we sort sequence numbers in decreasing order
     58 // and the value type is embedded as the low 8 bits in the sequence
     59 // number in internal keys, we need to use the highest-numbered
     60 // ValueType, not the lowest).
     61 static const ValueType kValueTypeForSeek = kTypeValue;
     62 
     63 typedef uint64_t SequenceNumber;
     64 
     65 // We leave eight bits empty at the bottom so a type and sequence#
     66 // can be packed together into 64-bits.
     67 static const SequenceNumber kMaxSequenceNumber =
     68     ((0x1ull << 56) - 1);
     69 
     70 struct ParsedInternalKey {
     71   Slice user_key;
     72   SequenceNumber sequence;
     73   ValueType type;
     74 
     75   ParsedInternalKey() { }  // Intentionally left uninitialized (for speed)
     76   ParsedInternalKey(const Slice& u, const SequenceNumber& seq, ValueType t)
     77       : user_key(u), sequence(seq), type(t) { }
     78   std::string DebugString() const;
     79 };
     80 
     81 // Return the length of the encoding of "key".
     82 inline size_t InternalKeyEncodingLength(const ParsedInternalKey& key) {
     83   return key.user_key.size() + 8;
     84 }
     85 
     86 // Append the serialization of "key" to *result.
     87 extern void AppendInternalKey(std::string* result,
     88                               const ParsedInternalKey& key);
     89 
     90 // Attempt to parse an internal key from "internal_key".  On success,
     91 // stores the parsed data in "*result", and returns true.
     92 //
     93 // On error, returns false, leaves "*result" in an undefined state.
     94 extern bool ParseInternalKey(const Slice& internal_key,
     95                              ParsedInternalKey* result);
     96 
     97 // Returns the user key portion of an internal key.
     98 inline Slice ExtractUserKey(const Slice& internal_key) {
     99   assert(internal_key.size() >= 8);
    100   return Slice(internal_key.data(), internal_key.size() - 8);
    101 }
    102 
    103 inline ValueType ExtractValueType(const Slice& internal_key) {
    104   assert(internal_key.size() >= 8);
    105   const size_t n = internal_key.size();
    106   uint64_t num = DecodeFixed64(internal_key.data() + n - 8);
    107   unsigned char c = num & 0xff;
    108   return static_cast<ValueType>(c);
    109 }
    110 
    111 // A comparator for internal keys that uses a specified comparator for
    112 // the user key portion and breaks ties by decreasing sequence number.
    113 class InternalKeyComparator : public Comparator {
    114  private:
    115   const Comparator* user_comparator_;
    116  public:
    117   explicit InternalKeyComparator(const Comparator* c) : user_comparator_(c) { }
    118   virtual const char* Name() const;
    119   virtual int Compare(const Slice& a, const Slice& b) const;
    120   virtual void FindShortestSeparator(
    121       std::string* start,
    122       const Slice& limit) const;
    123   virtual void FindShortSuccessor(std::string* key) const;
    124 
    125   const Comparator* user_comparator() const { return user_comparator_; }
    126 
    127   int Compare(const InternalKey& a, const InternalKey& b) const;
    128 };
    129 
    130 // Filter policy wrapper that converts from internal keys to user keys
    131 class InternalFilterPolicy : public FilterPolicy {
    132  private:
    133   const FilterPolicy* const user_policy_;
    134  public:
    135   explicit InternalFilterPolicy(const FilterPolicy* p) : user_policy_(p) { }
    136   virtual const char* Name() const;
    137   virtual void CreateFilter(const Slice* keys, int n, std::string* dst) const;
    138   virtual bool KeyMayMatch(const Slice& key, const Slice& filter) const;
    139 };
    140 
    141 // Modules in this directory should keep internal keys wrapped inside
    142 // the following class instead of plain strings so that we do not
    143 // incorrectly use string comparisons instead of an InternalKeyComparator.
    144 class InternalKey {
    145  private:
    146   std::string rep_;
    147  public:
    148   InternalKey() { }   // Leave rep_ as empty to indicate it is invalid
    149   InternalKey(const Slice& user_key, SequenceNumber s, ValueType t) {
    150     AppendInternalKey(&rep_, ParsedInternalKey(user_key, s, t));
    151   }
    152 
    153   void DecodeFrom(const Slice& s) { rep_.assign(s.data(), s.size()); }
    154   Slice Encode() const {
    155     assert(!rep_.empty());
    156     return rep_;
    157   }
    158 
    159   Slice user_key() const { return ExtractUserKey(rep_); }
    160 
    161   void SetFrom(const ParsedInternalKey& p) {
    162     rep_.clear();
    163     AppendInternalKey(&rep_, p);
    164   }
    165 
    166   void Clear() { rep_.clear(); }
    167 
    168   std::string DebugString() const;
    169 };
    170 
    171 inline int InternalKeyComparator::Compare(
    172     const InternalKey& a, const InternalKey& b) const {
    173   return Compare(a.Encode(), b.Encode());
    174 }
    175 
    176 inline bool ParseInternalKey(const Slice& internal_key,
    177                              ParsedInternalKey* result) {
    178   const size_t n = internal_key.size();
    179   if (n < 8) return false;
    180   uint64_t num = DecodeFixed64(internal_key.data() + n - 8);
    181   unsigned char c = num & 0xff;
    182   result->sequence = num >> 8;
    183   result->type = static_cast<ValueType>(c);
    184   result->user_key = Slice(internal_key.data(), n - 8);
    185   return (c <= static_cast<unsigned char>(kTypeValue));
    186 }
    187 
    188 // A helper class useful for DBImpl::Get()
    189 class LookupKey {
    190  public:
    191   // Initialize *this for looking up user_key at a snapshot with
    192   // the specified sequence number.
    193   LookupKey(const Slice& user_key, SequenceNumber sequence);
    194 
    195   ~LookupKey();
    196 
    197   // Return a key suitable for lookup in a MemTable.
    198   Slice memtable_key() const { return Slice(start_, end_ - start_); }
    199 
    200   // Return an internal key (suitable for passing to an internal iterator)
    201   Slice internal_key() const { return Slice(kstart_, end_ - kstart_); }
    202 
    203   // Return the user key
    204   Slice user_key() const { return Slice(kstart_, end_ - kstart_ - 8); }
    205 
    206  private:
    207   // We construct a char array of the form:
    208   //    klength  varint32               <-- start_
    209   //    userkey  char[klength]          <-- kstart_
    210   //    tag      uint64
    211   //                                    <-- end_
    212   // The array is a suitable MemTable key.
    213   // The suffix starting with "userkey" can be used as an InternalKey.
    214   const char* start_;
    215   const char* kstart_;
    216   const char* end_;
    217   char space_[200];      // Avoid allocation for short keys
    218 
    219   // No copying allowed
    220   LookupKey(const LookupKey&);
    221   void operator=(const LookupKey&);
    222 };
    223 
    224 inline LookupKey::~LookupKey() {
    225   if (start_ != space_) delete[] start_;
    226 }
    227 
    228 }  // namespace leveldb
    229 
    230 #endif  // STORAGE_LEVELDB_DB_FORMAT_H_
    231