Home | History | Annotate | Download | only in metrics
      1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
      2 // Use of this source code is governed by a BSD-style license that can be
      3 // found in the LICENSE file.
      4 
      5 // Histogram is an object that aggregates statistics, and can summarize them in
      6 // various forms, including ASCII graphical, HTML, and numerically (as a
      7 // vector of numbers corresponding to each of the aggregating buckets).
      8 
      9 // It supports calls to accumulate either time intervals (which are processed
     10 // as integral number of milliseconds), or arbitrary integral units.
     11 
     12 // For Histogram(exponential histogram), LinearHistogram and CustomHistogram,
     13 // the minimum for a declared range is 1 (instead of 0), while the maximum is
     14 // (HistogramBase::kSampleType_MAX - 1). Currently you can declare histograms
     15 // with ranges exceeding those limits (e.g. 0 as minimal or
     16 // HistogramBase::kSampleType_MAX as maximal), but those excesses will be
     17 // silently clamped to those limits (for backwards compatibility with existing
     18 // code). Best practice is to not exceed the limits.
     19 
     20 // Each use of a histogram with the same name will reference the same underlying
     21 // data, so it is safe to record to the same histogram from multiple locations
     22 // in the code. It is a runtime error if all uses of the same histogram do not
     23 // agree exactly in type, bucket size and range.
     24 
     25 // For Histogram and LinearHistogram, the maximum for a declared range should
     26 // always be larger (not equal) than minimal range. Zero and
     27 // HistogramBase::kSampleType_MAX are implicitly added as first and last ranges,
     28 // so the smallest legal bucket_count is 3. However CustomHistogram can have
     29 // bucket count as 2 (when you give a custom ranges vector containing only 1
     30 // range).
     31 // For these 3 kinds of histograms, the max bucket count is always
     32 // (Histogram::kBucketCount_MAX - 1).
     33 
     34 // The buckets layout of class Histogram is exponential. For example, buckets
     35 // might contain (sequentially) the count of values in the following intervals:
     36 // [0,1), [1,2), [2,4), [4,8), [8,16), [16,32), [32,64), [64,infinity)
     37 // That bucket allocation would actually result from construction of a histogram
     38 // for values between 1 and 64, with 8 buckets, such as:
     39 // Histogram count("some name", 1, 64, 8);
     40 // Note that the underflow bucket [0,1) and the overflow bucket [64,infinity)
     41 // are also counted by the constructor in the user supplied "bucket_count"
     42 // argument.
     43 // The above example has an exponential ratio of 2 (doubling the bucket width
     44 // in each consecutive bucket).  The Histogram class automatically calculates
     45 // the smallest ratio that it can use to construct the number of buckets
     46 // selected in the constructor.  As another example, if you had 50 buckets,
     47 // and millisecond time values from 1 to 10000, then the ratio between
     48 // consecutive bucket widths will be approximately somewhere around the 50th
     49 // root of 10000.  This approach provides very fine grain (narrow) buckets
     50 // at the low end of the histogram scale, but allows the histogram to cover a
     51 // gigantic range with the addition of very few buckets.
     52 
     53 // Usually we use macros to define and use a histogram. These macros use a
     54 // pattern involving a function static variable, that is a pointer to a
     55 // histogram.  This static is explicitly initialized on any thread
     56 // that detects an uninitialized (NULL) pointer.  The potentially racy
     57 // initialization is not a problem as it is always set to point to the same
     58 // value (i.e., the FactoryGet always returns the same value).  FactoryGet
     59 // is also completely thread safe, which results in a completely thread safe,
     60 // and relatively fast, set of counters.  To avoid races at shutdown, the static
     61 // pointer is NOT deleted, and we leak the histograms at process termination.
     62 
     63 #ifndef BASE_METRICS_HISTOGRAM_H_
     64 #define BASE_METRICS_HISTOGRAM_H_
     65 
     66 #include <map>
     67 #include <string>
     68 #include <vector>
     69 
     70 #include "base/atomicops.h"
     71 #include "base/base_export.h"
     72 #include "base/basictypes.h"
     73 #include "base/compiler_specific.h"
     74 #include "base/gtest_prod_util.h"
     75 #include "base/logging.h"
     76 #include "base/memory/scoped_ptr.h"
     77 #include "base/metrics/bucket_ranges.h"
     78 #include "base/metrics/histogram_base.h"
     79 #include "base/metrics/histogram_samples.h"
     80 #include "base/time/time.h"
     81 
     82 class Pickle;
     83 class PickleIterator;
     84 
     85 namespace base {
     86 
     87 class Lock;
     88 //------------------------------------------------------------------------------
     89 // Histograms are often put in areas where they are called many many times, and
     90 // performance is critical.  As a result, they are designed to have a very low
     91 // recurring cost of executing (adding additional samples).  Toward that end,
     92 // the macros declare a static pointer to the histogram in question, and only
     93 // take a "slow path" to construct (or find) the histogram on the first run
     94 // through the macro.  We leak the histograms at shutdown time so that we don't
     95 // have to validate using the pointers at any time during the running of the
     96 // process.
     97 
     98 // The following code is generally what a thread-safe static pointer
     99 // initialization looks like for a histogram (after a macro is expanded).  This
    100 // sample is an expansion (with comments) of the code for
    101 // HISTOGRAM_CUSTOM_COUNTS().
    102 
    103 /*
    104   do {
    105     // The pointer's presence indicates the initialization is complete.
    106     // Initialization is idempotent, so it can safely be atomically repeated.
    107     static base::subtle::AtomicWord atomic_histogram_pointer = 0;
    108 
    109     // Acquire_Load() ensures that we acquire visibility to the pointed-to data
    110     // in the histogram.
    111     base::Histogram* histogram_pointer(reinterpret_cast<base::Histogram*>(
    112         base::subtle::Acquire_Load(&atomic_histogram_pointer)));
    113 
    114     if (!histogram_pointer) {
    115       // This is the slow path, which will construct OR find the matching
    116       // histogram.  FactoryGet includes locks on a global histogram name map
    117       // and is completely thread safe.
    118       histogram_pointer = base::Histogram::FactoryGet(
    119           name, min, max, bucket_count, base::HistogramBase::kNoFlags);
    120 
    121       // Use Release_Store to ensure that the histogram data is made available
    122       // globally before we make the pointer visible.
    123       // Several threads may perform this store, but the same value will be
    124       // stored in all cases (for a given named/spec'ed histogram).
    125       // We could do this without any barrier, since FactoryGet entered and
    126       // exited a lock after construction, but this barrier makes things clear.
    127       base::subtle::Release_Store(&atomic_histogram_pointer,
    128           reinterpret_cast<base::subtle::AtomicWord>(histogram_pointer));
    129     }
    130 
    131     // Ensure calling contract is upheld, and the name does NOT vary.
    132     DCHECK(histogram_pointer->histogram_name() == constant_histogram_name);
    133 
    134     histogram_pointer->Add(sample);
    135   } while (0);
    136 */
    137 
    138 // The above pattern is repeated in several macros.  The only elements that
    139 // vary are the invocation of the Add(sample) vs AddTime(sample), and the choice
    140 // of which FactoryGet method to use.  The different FactoryGet methods have
    141 // various argument lists, so the function with its argument list is provided as
    142 // a macro argument here.  The name is only used in a DCHECK, to assure that
    143 // callers don't try to vary the name of the histogram (which would tend to be
    144 // ignored by the one-time initialization of the histogtram_pointer).
    145 #define STATIC_HISTOGRAM_POINTER_BLOCK(constant_histogram_name, \
    146                                        histogram_add_method_invocation, \
    147                                        histogram_factory_get_invocation) \
    148   do { \
    149     static base::subtle::AtomicWord atomic_histogram_pointer = 0; \
    150     base::HistogramBase* histogram_pointer( \
    151         reinterpret_cast<base::HistogramBase*>( \
    152             base::subtle::Acquire_Load(&atomic_histogram_pointer))); \
    153     if (!histogram_pointer) { \
    154       histogram_pointer = histogram_factory_get_invocation; \
    155       base::subtle::Release_Store(&atomic_histogram_pointer, \
    156           reinterpret_cast<base::subtle::AtomicWord>(histogram_pointer)); \
    157     } \
    158     DCHECK_EQ(histogram_pointer->histogram_name(), \
    159               std::string(constant_histogram_name)); \
    160     histogram_pointer->histogram_add_method_invocation; \
    161   } while (0)
    162 
    163 
    164 //------------------------------------------------------------------------------
    165 // Provide easy general purpose histogram in a macro, just like stats counters.
    166 // The first four macros use 50 buckets.
    167 
    168 #define HISTOGRAM_TIMES(name, sample) HISTOGRAM_CUSTOM_TIMES( \
    169     name, sample, base::TimeDelta::FromMilliseconds(1), \
    170     base::TimeDelta::FromSeconds(10), 50)
    171 
    172 // For folks that need real specific times, use this to select a precise range
    173 // of times you want plotted, and the number of buckets you want used.
    174 #define HISTOGRAM_CUSTOM_TIMES(name, sample, min, max, bucket_count) \
    175     STATIC_HISTOGRAM_POINTER_BLOCK(name, AddTime(sample), \
    176         base::Histogram::FactoryTimeGet(name, min, max, bucket_count, \
    177                                         base::HistogramBase::kNoFlags))
    178 
    179 #define HISTOGRAM_COUNTS(name, sample) HISTOGRAM_CUSTOM_COUNTS( \
    180     name, sample, 1, 1000000, 50)
    181 
    182 #define HISTOGRAM_COUNTS_100(name, sample) HISTOGRAM_CUSTOM_COUNTS( \
    183     name, sample, 1, 100, 50)
    184 
    185 #define HISTOGRAM_COUNTS_10000(name, sample) HISTOGRAM_CUSTOM_COUNTS( \
    186     name, sample, 1, 10000, 50)
    187 
    188 #define HISTOGRAM_CUSTOM_COUNTS(name, sample, min, max, bucket_count) \
    189     STATIC_HISTOGRAM_POINTER_BLOCK(name, Add(sample), \
    190         base::Histogram::FactoryGet(name, min, max, bucket_count, \
    191                                     base::HistogramBase::kNoFlags))
    192 
    193 #define HISTOGRAM_PERCENTAGE(name, under_one_hundred) \
    194     HISTOGRAM_ENUMERATION(name, under_one_hundred, 101)
    195 
    196 #define HISTOGRAM_BOOLEAN(name, sample) \
    197     STATIC_HISTOGRAM_POINTER_BLOCK(name, AddBoolean(sample), \
    198         base::BooleanHistogram::FactoryGet(name, base::Histogram::kNoFlags))
    199 
    200 // Support histograming of an enumerated value.  The samples should always be
    201 // strictly less than |boundary_value| -- this prevents you from running into
    202 // problems down the line if you add additional buckets to the histogram.  Note
    203 // also that, despite explicitly setting the minimum bucket value to |1| below,
    204 // it is fine for enumerated histograms to be 0-indexed -- this is because
    205 // enumerated histograms should never have underflow.
    206 #define HISTOGRAM_ENUMERATION(name, sample, boundary_value) \
    207     STATIC_HISTOGRAM_POINTER_BLOCK(name, Add(sample), \
    208         base::LinearHistogram::FactoryGet(name, 1, boundary_value, \
    209             boundary_value + 1, base::HistogramBase::kNoFlags))
    210 
    211 // Support histograming of an enumerated value. Samples should be one of the
    212 // std::vector<int> list provided via |custom_ranges|. See comments above
    213 // CustomRanges::FactoryGet about the requirement of |custom_ranges|.
    214 // You can use the helper function CustomHistogram::ArrayToCustomRanges to
    215 // transform a C-style array of valid sample values to a std::vector<int>.
    216 #define HISTOGRAM_CUSTOM_ENUMERATION(name, sample, custom_ranges) \
    217     STATIC_HISTOGRAM_POINTER_BLOCK(name, Add(sample), \
    218         base::CustomHistogram::FactoryGet(name, custom_ranges, \
    219                                           base::HistogramBase::kNoFlags))
    220 
    221 #define HISTOGRAM_MEMORY_KB(name, sample) HISTOGRAM_CUSTOM_COUNTS( \
    222     name, sample, 1000, 500000, 50)
    223 
    224 //------------------------------------------------------------------------------
    225 // Define Debug vs non-debug flavors of macros.
    226 #ifndef NDEBUG
    227 
    228 #define DHISTOGRAM_TIMES(name, sample) HISTOGRAM_TIMES(name, sample)
    229 #define DHISTOGRAM_COUNTS(name, sample) HISTOGRAM_COUNTS(name, sample)
    230 #define DHISTOGRAM_PERCENTAGE(name, under_one_hundred) HISTOGRAM_PERCENTAGE(\
    231     name, under_one_hundred)
    232 #define DHISTOGRAM_CUSTOM_TIMES(name, sample, min, max, bucket_count) \
    233     HISTOGRAM_CUSTOM_TIMES(name, sample, min, max, bucket_count)
    234 #define DHISTOGRAM_CLIPPED_TIMES(name, sample, min, max, bucket_count) \
    235     HISTOGRAM_CLIPPED_TIMES(name, sample, min, max, bucket_count)
    236 #define DHISTOGRAM_CUSTOM_COUNTS(name, sample, min, max, bucket_count) \
    237     HISTOGRAM_CUSTOM_COUNTS(name, sample, min, max, bucket_count)
    238 #define DHISTOGRAM_ENUMERATION(name, sample, boundary_value) \
    239     HISTOGRAM_ENUMERATION(name, sample, boundary_value)
    240 #define DHISTOGRAM_CUSTOM_ENUMERATION(name, sample, custom_ranges) \
    241     HISTOGRAM_CUSTOM_ENUMERATION(name, sample, custom_ranges)
    242 
    243 #else  // NDEBUG
    244 // Keep a mention of passed variables to avoid unused variable warnings in
    245 // release build if these variables are only used in macros.
    246 #define DISCARD_2_ARGUMENTS(a, b) \
    247   while (0) { \
    248     static_cast<void>(a); \
    249     static_cast<void>(b); \
    250  }
    251 #define DISCARD_3_ARGUMENTS(a, b, c) \
    252   while (0) { \
    253     static_cast<void>(a); \
    254     static_cast<void>(b); \
    255     static_cast<void>(c); \
    256  }
    257 #define DISCARD_5_ARGUMENTS(a, b, c, d ,e) \
    258   while (0) { \
    259     static_cast<void>(a); \
    260     static_cast<void>(b); \
    261     static_cast<void>(c); \
    262     static_cast<void>(d); \
    263     static_cast<void>(e); \
    264  }
    265 #define DHISTOGRAM_TIMES(name, sample) \
    266     DISCARD_2_ARGUMENTS(name, sample)
    267 
    268 #define DHISTOGRAM_COUNTS(name, sample) \
    269     DISCARD_2_ARGUMENTS(name, sample)
    270 
    271 #define DHISTOGRAM_PERCENTAGE(name, under_one_hundred) \
    272     DISCARD_2_ARGUMENTS(name, under_one_hundred)
    273 
    274 #define DHISTOGRAM_CUSTOM_TIMES(name, sample, min, max, bucket_count) \
    275     DISCARD_5_ARGUMENTS(name, sample, min, max, bucket_count)
    276 
    277 #define DHISTOGRAM_CLIPPED_TIMES(name, sample, min, max, bucket_count) \
    278     DISCARD_5_ARGUMENTS(name, sample, min, max, bucket_count)
    279 
    280 #define DHISTOGRAM_CUSTOM_COUNTS(name, sample, min, max, bucket_count) \
    281     DISCARD_5_ARGUMENTS(name, sample, min, max, bucket_count)
    282 
    283 #define DHISTOGRAM_ENUMERATION(name, sample, boundary_value) \
    284     DISCARD_3_ARGUMENTS(name, sample, boundary_value)
    285 
    286 #define DHISTOGRAM_CUSTOM_ENUMERATION(name, sample, custom_ranges) \
    287     DISCARD_3_ARGUMENTS(name, sample, custom_ranges)
    288 
    289 #endif  // NDEBUG
    290 
    291 //------------------------------------------------------------------------------
    292 // The following macros provide typical usage scenarios for callers that wish
    293 // to record histogram data, and have the data submitted/uploaded via UMA.
    294 // Not all systems support such UMA, but if they do, the following macros
    295 // should work with the service.
    296 
    297 #define UMA_HISTOGRAM_TIMES(name, sample) UMA_HISTOGRAM_CUSTOM_TIMES( \
    298     name, sample, base::TimeDelta::FromMilliseconds(1), \
    299     base::TimeDelta::FromSeconds(10), 50)
    300 
    301 #define UMA_HISTOGRAM_MEDIUM_TIMES(name, sample) UMA_HISTOGRAM_CUSTOM_TIMES( \
    302     name, sample, base::TimeDelta::FromMilliseconds(10), \
    303     base::TimeDelta::FromMinutes(3), 50)
    304 
    305 // Use this macro when times can routinely be much longer than 10 seconds.
    306 #define UMA_HISTOGRAM_LONG_TIMES(name, sample) UMA_HISTOGRAM_CUSTOM_TIMES( \
    307     name, sample, base::TimeDelta::FromMilliseconds(1), \
    308     base::TimeDelta::FromHours(1), 50)
    309 
    310 // Use this macro when times can routinely be much longer than 10 seconds and
    311 // you want 100 buckets.
    312 #define UMA_HISTOGRAM_LONG_TIMES_100(name, sample) UMA_HISTOGRAM_CUSTOM_TIMES( \
    313     name, sample, base::TimeDelta::FromMilliseconds(1), \
    314     base::TimeDelta::FromHours(1), 100)
    315 
    316 #define UMA_HISTOGRAM_CUSTOM_TIMES(name, sample, min, max, bucket_count) \
    317     STATIC_HISTOGRAM_POINTER_BLOCK(name, AddTime(sample), \
    318         base::Histogram::FactoryTimeGet(name, min, max, bucket_count, \
    319             base::HistogramBase::kUmaTargetedHistogramFlag))
    320 
    321 #define UMA_HISTOGRAM_COUNTS(name, sample) UMA_HISTOGRAM_CUSTOM_COUNTS( \
    322     name, sample, 1, 1000000, 50)
    323 
    324 #define UMA_HISTOGRAM_COUNTS_100(name, sample) UMA_HISTOGRAM_CUSTOM_COUNTS( \
    325     name, sample, 1, 100, 50)
    326 
    327 #define UMA_HISTOGRAM_COUNTS_10000(name, sample) UMA_HISTOGRAM_CUSTOM_COUNTS( \
    328     name, sample, 1, 10000, 50)
    329 
    330 #define UMA_HISTOGRAM_CUSTOM_COUNTS(name, sample, min, max, bucket_count) \
    331     STATIC_HISTOGRAM_POINTER_BLOCK(name, Add(sample), \
    332         base::Histogram::FactoryGet(name, min, max, bucket_count, \
    333             base::HistogramBase::kUmaTargetedHistogramFlag))
    334 
    335 #define UMA_HISTOGRAM_MEMORY_KB(name, sample) UMA_HISTOGRAM_CUSTOM_COUNTS( \
    336     name, sample, 1000, 500000, 50)
    337 
    338 #define UMA_HISTOGRAM_MEMORY_MB(name, sample) UMA_HISTOGRAM_CUSTOM_COUNTS( \
    339     name, sample, 1, 1000, 50)
    340 
    341 #define UMA_HISTOGRAM_PERCENTAGE(name, under_one_hundred) \
    342     UMA_HISTOGRAM_ENUMERATION(name, under_one_hundred, 101)
    343 
    344 #define UMA_HISTOGRAM_BOOLEAN(name, sample) \
    345     STATIC_HISTOGRAM_POINTER_BLOCK(name, AddBoolean(sample), \
    346         base::BooleanHistogram::FactoryGet(name, \
    347             base::HistogramBase::kUmaTargetedHistogramFlag))
    348 
    349 // The samples should always be strictly less than |boundary_value|.  For more
    350 // details, see the comment for the |HISTOGRAM_ENUMERATION| macro, above.
    351 #define UMA_HISTOGRAM_ENUMERATION(name, sample, boundary_value) \
    352     STATIC_HISTOGRAM_POINTER_BLOCK(name, Add(sample), \
    353         base::LinearHistogram::FactoryGet(name, 1, boundary_value, \
    354             boundary_value + 1, base::HistogramBase::kUmaTargetedHistogramFlag))
    355 
    356 #define UMA_HISTOGRAM_CUSTOM_ENUMERATION(name, sample, custom_ranges) \
    357     STATIC_HISTOGRAM_POINTER_BLOCK(name, Add(sample), \
    358         base::CustomHistogram::FactoryGet(name, custom_ranges, \
    359             base::HistogramBase::kUmaTargetedHistogramFlag))
    360 
    361 //------------------------------------------------------------------------------
    362 
    363 class BucketRanges;
    364 class SampleVector;
    365 
    366 class BooleanHistogram;
    367 class CustomHistogram;
    368 class Histogram;
    369 class LinearHistogram;
    370 
    371 class BASE_EXPORT Histogram : public HistogramBase {
    372  public:
    373   // Initialize maximum number of buckets in histograms as 16,384.
    374   static const size_t kBucketCount_MAX;
    375 
    376   typedef std::vector<Count> Counts;
    377 
    378   //----------------------------------------------------------------------------
    379   // For a valid histogram, input should follow these restrictions:
    380   // minimum > 0 (if a minimum below 1 is specified, it will implicitly be
    381   //              normalized up to 1)
    382   // maximum > minimum
    383   // buckets > 2 [minimum buckets needed: underflow, overflow and the range]
    384   // Additionally,
    385   // buckets <= (maximum - minimum + 2) - this is to ensure that we don't have
    386   // more buckets than the range of numbers; having more buckets than 1 per
    387   // value in the range would be nonsensical.
    388   static HistogramBase* FactoryGet(const std::string& name,
    389                                    Sample minimum,
    390                                    Sample maximum,
    391                                    size_t bucket_count,
    392                                    int32 flags);
    393   static HistogramBase* FactoryTimeGet(const std::string& name,
    394                                        base::TimeDelta minimum,
    395                                        base::TimeDelta maximum,
    396                                        size_t bucket_count,
    397                                        int32 flags);
    398 
    399   // Time call for use with DHISTOGRAM*.
    400   // Returns TimeTicks::Now() in debug and TimeTicks() in release build.
    401   static TimeTicks DebugNow();
    402 
    403   static void InitializeBucketRanges(Sample minimum,
    404                                      Sample maximum,
    405                                      BucketRanges* ranges);
    406 
    407   // This constant if for FindCorruption. Since snapshots of histograms are
    408   // taken asynchronously relative to sampling, and our counting code currently
    409   // does not prevent race conditions, it is pretty likely that we'll catch a
    410   // redundant count that doesn't match the sample count.  We allow for a
    411   // certain amount of slop before flagging this as an inconsistency. Even with
    412   // an inconsistency, we'll snapshot it again (for UMA in about a half hour),
    413   // so we'll eventually get the data, if it was not the result of a corruption.
    414   static const int kCommonRaceBasedCountMismatch;
    415 
    416   // Check to see if bucket ranges, counts and tallies in the snapshot are
    417   // consistent with the bucket ranges and checksums in our histogram.  This can
    418   // produce a false-alarm if a race occurred in the reading of the data during
    419   // a SnapShot process, but should otherwise be false at all times (unless we
    420   // have memory over-writes, or DRAM failures).
    421   virtual int FindCorruption(const HistogramSamples& samples) const OVERRIDE;
    422 
    423   //----------------------------------------------------------------------------
    424   // Accessors for factory construction, serialization and testing.
    425   //----------------------------------------------------------------------------
    426   Sample declared_min() const { return declared_min_; }
    427   Sample declared_max() const { return declared_max_; }
    428   virtual Sample ranges(size_t i) const;
    429   virtual size_t bucket_count() const;
    430   const BucketRanges* bucket_ranges() const { return bucket_ranges_; }
    431 
    432   // This function validates histogram construction arguments. It returns false
    433   // if some of the arguments are totally bad.
    434   // Note. Currently it allow some bad input, e.g. 0 as minimum, but silently
    435   // converts it to good input: 1.
    436   // TODO(kaiwang): Be more restrict and return false for any bad input, and
    437   // make this a readonly validating function.
    438   static bool InspectConstructionArguments(const std::string& name,
    439                                            Sample* minimum,
    440                                            Sample* maximum,
    441                                            size_t* bucket_count);
    442 
    443   // HistogramBase implementation:
    444   virtual HistogramType GetHistogramType() const OVERRIDE;
    445   virtual bool HasConstructionArguments(
    446       Sample expected_minimum,
    447       Sample expected_maximum,
    448       size_t expected_bucket_count) const OVERRIDE;
    449   virtual void Add(Sample value) OVERRIDE;
    450   virtual scoped_ptr<HistogramSamples> SnapshotSamples() const OVERRIDE;
    451   virtual void AddSamples(const HistogramSamples& samples) OVERRIDE;
    452   virtual bool AddSamplesFromPickle(PickleIterator* iter) OVERRIDE;
    453   virtual void WriteHTMLGraph(std::string* output) const OVERRIDE;
    454   virtual void WriteAscii(std::string* output) const OVERRIDE;
    455 
    456  protected:
    457   // |ranges| should contain the underflow and overflow buckets. See top
    458   // comments for example.
    459   Histogram(const std::string& name,
    460             Sample minimum,
    461             Sample maximum,
    462             const BucketRanges* ranges);
    463 
    464   virtual ~Histogram();
    465 
    466   // HistogramBase implementation:
    467   virtual bool SerializeInfoImpl(Pickle* pickle) const OVERRIDE;
    468 
    469   // Method to override to skip the display of the i'th bucket if it's empty.
    470   virtual bool PrintEmptyBucket(size_t index) const;
    471 
    472   // Get normalized size, relative to the ranges(i).
    473   virtual double GetBucketSize(Count current, size_t i) const;
    474 
    475   // Return a string description of what goes in a given bucket.
    476   // Most commonly this is the numeric value, but in derived classes it may
    477   // be a name (or string description) given to the bucket.
    478   virtual const std::string GetAsciiBucketRange(size_t it) const;
    479 
    480  private:
    481   // Allow tests to corrupt our innards for testing purposes.
    482   FRIEND_TEST_ALL_PREFIXES(HistogramTest, BoundsTest);
    483   FRIEND_TEST_ALL_PREFIXES(HistogramTest, BucketPlacementTest);
    484   FRIEND_TEST_ALL_PREFIXES(HistogramTest, CorruptBucketBounds);
    485   FRIEND_TEST_ALL_PREFIXES(HistogramTest, CorruptSampleCounts);
    486   FRIEND_TEST_ALL_PREFIXES(HistogramTest, NameMatchTest);
    487 
    488   friend class StatisticsRecorder;  // To allow it to delete duplicates.
    489   friend class StatisticsRecorderTest;
    490 
    491   friend BASE_EXPORT_PRIVATE HistogramBase* DeserializeHistogramInfo(
    492       PickleIterator* iter);
    493   static HistogramBase* DeserializeInfoImpl(PickleIterator* iter);
    494 
    495   // Implementation of SnapshotSamples function.
    496   scoped_ptr<SampleVector> SnapshotSampleVector() const;
    497 
    498   //----------------------------------------------------------------------------
    499   // Helpers for emitting Ascii graphic.  Each method appends data to output.
    500 
    501   void WriteAsciiImpl(bool graph_it,
    502                       const std::string& newline,
    503                       std::string* output) const;
    504 
    505   // Find out how large (graphically) the largest bucket will appear to be.
    506   double GetPeakBucketSize(const SampleVector& samples) const;
    507 
    508   // Write a common header message describing this histogram.
    509   void WriteAsciiHeader(const SampleVector& samples,
    510                         Count sample_count,
    511                         std::string* output) const;
    512 
    513   // Write information about previous, current, and next buckets.
    514   // Information such as cumulative percentage, etc.
    515   void WriteAsciiBucketContext(const int64 past, const Count current,
    516                                const int64 remaining, const size_t i,
    517                                std::string* output) const;
    518 
    519   // WriteJSON calls these.
    520   virtual void GetParameters(DictionaryValue* params) const OVERRIDE;
    521 
    522   virtual void GetCountAndBucketData(Count* count,
    523                                      int64* sum,
    524                                      ListValue* buckets) const OVERRIDE;
    525 
    526   // Does not own this object. Should get from StatisticsRecorder.
    527   const BucketRanges* bucket_ranges_;
    528 
    529   Sample declared_min_;  // Less than this goes into the first bucket.
    530   Sample declared_max_;  // Over this goes into the last bucket.
    531 
    532   // Finally, provide the state that changes with the addition of each new
    533   // sample.
    534   scoped_ptr<SampleVector> samples_;
    535 
    536   DISALLOW_COPY_AND_ASSIGN(Histogram);
    537 };
    538 
    539 //------------------------------------------------------------------------------
    540 
    541 // LinearHistogram is a more traditional histogram, with evenly spaced
    542 // buckets.
    543 class BASE_EXPORT LinearHistogram : public Histogram {
    544  public:
    545   virtual ~LinearHistogram();
    546 
    547   /* minimum should start from 1. 0 is as minimum is invalid. 0 is an implicit
    548      default underflow bucket. */
    549   static HistogramBase* FactoryGet(const std::string& name,
    550                                    Sample minimum,
    551                                    Sample maximum,
    552                                    size_t bucket_count,
    553                                    int32 flags);
    554   static HistogramBase* FactoryTimeGet(const std::string& name,
    555                                        TimeDelta minimum,
    556                                        TimeDelta maximum,
    557                                        size_t bucket_count,
    558                                        int32 flags);
    559 
    560   struct DescriptionPair {
    561     Sample sample;
    562     const char* description;  // Null means end of a list of pairs.
    563   };
    564 
    565   // Create a LinearHistogram and store a list of number/text values for use in
    566   // writing the histogram graph.
    567   // |descriptions| can be NULL, which means no special descriptions to set. If
    568   // it's not NULL, the last element in the array must has a NULL in its
    569   // "description" field.
    570   static HistogramBase* FactoryGetWithRangeDescription(
    571       const std::string& name,
    572       Sample minimum,
    573       Sample maximum,
    574       size_t bucket_count,
    575       int32 flags,
    576       const DescriptionPair descriptions[]);
    577 
    578   static void InitializeBucketRanges(Sample minimum,
    579                                      Sample maximum,
    580                                      BucketRanges* ranges);
    581 
    582   // Overridden from Histogram:
    583   virtual HistogramType GetHistogramType() const OVERRIDE;
    584 
    585  protected:
    586   LinearHistogram(const std::string& name,
    587                   Sample minimum,
    588                   Sample maximum,
    589                   const BucketRanges* ranges);
    590 
    591   virtual double GetBucketSize(Count current, size_t i) const OVERRIDE;
    592 
    593   // If we have a description for a bucket, then return that.  Otherwise
    594   // let parent class provide a (numeric) description.
    595   virtual const std::string GetAsciiBucketRange(size_t i) const OVERRIDE;
    596 
    597   // Skip printing of name for numeric range if we have a name (and if this is
    598   // an empty bucket).
    599   virtual bool PrintEmptyBucket(size_t index) const OVERRIDE;
    600 
    601  private:
          // DeserializeHistogramInfo() is declared a friend, which gives it access to
          // the private static DeserializeInfoImpl() below.
          // NOTE(review): DeserializeInfoImpl() presumably rebuilds a histogram from
          // the pickled data read through |iter| -- confirm against the definition.
    602   friend BASE_EXPORT_PRIVATE HistogramBase* DeserializeHistogramInfo(
    603       PickleIterator* iter);
    604   static HistogramBase* DeserializeInfoImpl(PickleIterator* iter);
    605 
    606   // For some ranges, we store a printable description of a bucket range.
    607   // If there is no description, then GetAsciiBucketRange() uses parent class
    608   // to provide a description.
    609   typedef std::map<Sample, std::string> BucketDescriptionMap;
    610   BucketDescriptionMap bucket_description_;
    611 
    612   DISALLOW_COPY_AND_ASSIGN(LinearHistogram);
    613 };
    614 
    615 //------------------------------------------------------------------------------
    616 
    617 // BooleanHistogram is a histogram for booleans.
        // It derives from LinearHistogram, and the only constructor it declares is
        // private, so client code cannot construct one directly.
    618 class BASE_EXPORT BooleanHistogram : public LinearHistogram {
    619  public:
          // Unlike LinearHistogram::FactoryGet(), this takes no range or bucket count:
          // the caller supplies only |name| and |flags|.
    620   static HistogramBase* FactoryGet(const std::string& name, int32 flags);
    621 
          // Overridden from LinearHistogram.
    622   virtual HistogramType GetHistogramType() const OVERRIDE;
    623 
    624  private:
          // NOTE(review): |ranges| is presumably a fixed set of bucket ranges chosen
          // by FactoryGet() -- confirm against the definition.
    625   BooleanHistogram(const std::string& name, const BucketRanges* ranges);
    626 
          // DeserializeHistogramInfo() is declared a friend, which gives it access to
          // the private static DeserializeInfoImpl() below.
    627   friend BASE_EXPORT_PRIVATE HistogramBase* DeserializeHistogramInfo(
    628       PickleIterator* iter);
    629   static HistogramBase* DeserializeInfoImpl(PickleIterator* iter);
    630 
    631   DISALLOW_COPY_AND_ASSIGN(BooleanHistogram);
    632 };
    633 
    634 //------------------------------------------------------------------------------
    635 
    636 // CustomHistogram is a histogram for a set of custom integers.
        // As noted at the top of this file, a CustomHistogram may have a bucket count
        // as low as 2 (when the custom ranges vector contains only 1 range), whereas
        // Histogram and LinearHistogram need at least 3.
    637 class BASE_EXPORT CustomHistogram : public Histogram {
    638  public:
    639   // |custom_ranges| contains a vector of limits on ranges. Each limit should be
    640   // > 0 and < kSampleType_MAX. (Currently 0 is still accepted for backward
    641   // compatibility). The limits can be unordered or contain duplication, but
    642   // clients should not depend on this.
    643   static HistogramBase* FactoryGet(const std::string& name,
    644                                    const std::vector<Sample>& custom_ranges,
    645                                    int32 flags);
    646 
    647   // Overridden from Histogram:
    648   virtual HistogramType GetHistogramType() const OVERRIDE;
    649 
    650   // Helper method for transforming an array of valid enumeration values
    651   // to the std::vector<int> expected by HISTOGRAM_CUSTOM_ENUMERATION.
    652   // This function ensures that a guard bucket exists right after any
    653   // valid sample value (unless the next higher sample is also a valid value),
    654   // so that invalid samples never fall into the same bucket as valid samples.
    655   // |values| points to the first of |num_values| enumeration values.
    655   // TODO(kaiwang): Change name to ArrayToCustomEnumRanges.
    656   static std::vector<Sample> ArrayToCustomRanges(const Sample* values,
    657                                                  size_t num_values);
    658  protected:
          // Protected constructor: callable only from this class, its subclasses and
          // its friends.
    659   CustomHistogram(const std::string& name,
    660                   const BucketRanges* ranges);
    661 
    662   // HistogramBase implementation:
    663   virtual bool SerializeInfoImpl(Pickle* pickle) const OVERRIDE;
    664 
    665   virtual double GetBucketSize(Count current, size_t i) const OVERRIDE;
    666 
    667  private:
          // DeserializeHistogramInfo() is declared a friend, which gives it access to
          // the private static DeserializeInfoImpl() below.
    668   friend BASE_EXPORT_PRIVATE HistogramBase* DeserializeHistogramInfo(
    669       PickleIterator* iter);
    670   static HistogramBase* DeserializeInfoImpl(PickleIterator* iter);
    671 
          // NOTE(review): presumably checks |custom_ranges| against the limits
          // documented on FactoryGet() -- confirm against the definition.
    672   static bool ValidateCustomRanges(const std::vector<Sample>& custom_ranges);
          // NOTE(review): presumably builds the BucketRanges for |custom_ranges|;
          // ownership of the returned pointer is not visible from this declaration
          // -- confirm against the definition.
    673   static BucketRanges* CreateBucketRangesFromCustomRanges(
    674       const std::vector<Sample>& custom_ranges);
    675 
    676   DISALLOW_COPY_AND_ASSIGN(CustomHistogram);
    677 };
    678 
    679 }  // namespace base
    680 
    681 #endif  // BASE_METRICS_HISTOGRAM_H_
    682