|  | // Copyright (c) 2012 The Chromium Authors. All rights reserved. | 
|  | // Use of this source code is governed by a BSD-style license that can be | 
|  | // found in the LICENSE file. | 
|  |  | 
|  | // Histogram is an object that aggregates statistics, and can summarize them in | 
|  | // various forms, including ASCII graphical, HTML, and numerically (as a | 
|  | // vector of numbers corresponding to each of the aggregating buckets). | 
|  |  | 
|  | // It supports calls to accumulate either time intervals (which are processed | 
|  | // as integral number of milliseconds), or arbitrary integral units. | 
|  |  | 
|  | // For Histogram(exponential histogram), LinearHistogram and CustomHistogram, | 
|  | // the minimum for a declared range is 1 (instead of 0), while the maximum is | 
|  | // (HistogramBase::kSampleType_MAX - 1). Currently you can declare histograms | 
|  | // with ranges exceeding those limits (e.g. 0 as minimal or | 
|  | // HistogramBase::kSampleType_MAX as maximal), but those excesses will be | 
|  | // silently clamped to those limits (for backwards compatibility with existing | 
|  | // code). Best practice is to not exceed the limits. | 
|  |  | 
|  | // Each use of a histogram with the same name will reference the same underlying | 
|  | // data, so it is safe to record to the same histogram from multiple locations | 
|  | // in the code. It is a runtime error if all uses of the same histogram do not | 
|  | // agree exactly in type, bucket size and range. | 
|  |  | 
|  | // For Histogram and LinearHistogram, the maximum for a declared range should | 
|  | // always be strictly larger than the minimum. Zero and | 
|  | // HistogramBase::kSampleType_MAX are implicitly added as first and last ranges, | 
|  | // so the smallest legal bucket_count is 3. However CustomHistogram can have | 
|  | // bucket count as 2 (when you give a custom ranges vector containing only 1 | 
|  | // range). | 
|  | // For these 3 kinds of histograms, the max bucket count is always | 
|  | // (Histogram::kBucketCount_MAX - 1). | 
|  |  | 
|  | // The buckets layout of class Histogram is exponential. For example, buckets | 
|  | // might contain (sequentially) the count of values in the following intervals: | 
|  | // [0,1), [1,2), [2,4), [4,8), [8,16), [16,32), [32,64), [64,infinity) | 
|  | // That bucket allocation would actually result from construction of a histogram | 
|  | // for values between 1 and 64, with 8 buckets, such as: | 
|  | // Histogram count("some name", 1, 64, 8); | 
|  | // Note that the underflow bucket [0,1) and the overflow bucket [64,infinity) | 
|  | // are also counted by the constructor in the user supplied "bucket_count" | 
|  | // argument. | 
|  | // The above example has an exponential ratio of 2 (doubling the bucket width | 
|  | // in each consecutive bucket).  The Histogram class automatically calculates | 
|  | // the smallest ratio that it can use to construct the number of buckets | 
|  | // selected in the constructor.  As another example, if you had 50 buckets, | 
|  | // and millisecond time values from 1 to 10000, then the ratio between | 
|  | // consecutive bucket widths would be approximately the 50th | 
|  | // root of 10000.  This approach provides very fine grain (narrow) buckets | 
|  | // at the low end of the histogram scale, but allows the histogram to cover a | 
|  | // gigantic range with the addition of very few buckets. | 
|  |  | 
|  | // Usually we use macros to define and use a histogram, which are defined in | 
|  | // base/metrics/histogram_macros.h. Note: Callers should include that header | 
|  | // directly if they only access the histogram APIs through macros. | 
|  | // | 
|  | // Macros use a pattern involving a function static variable, that is a pointer | 
|  | // to a histogram.  This static is explicitly initialized on any thread | 
|  | // that detects an uninitialized (NULL) pointer.  The potentially racy | 
|  | // initialization is not a problem as it is always set to point to the same | 
|  | // value (i.e., the FactoryGet always returns the same value).  FactoryGet | 
|  | // is also completely thread safe, which results in a completely thread safe, | 
|  | // and relatively fast, set of counters.  To avoid races at shutdown, the static | 
|  | // pointer is NOT deleted, and we leak the histograms at process termination. | 
|  |  | 
|  | #ifndef BASE_METRICS_HISTOGRAM_H_ | 
|  | #define BASE_METRICS_HISTOGRAM_H_ | 
|  |  | 
|  | #include <map> | 
|  | #include <string> | 
|  | #include <vector> | 
|  |  | 
|  | #include "base/base_export.h" | 
|  | #include "base/basictypes.h" | 
|  | #include "base/compiler_specific.h" | 
|  | #include "base/gtest_prod_util.h" | 
|  | #include "base/logging.h" | 
|  | #include "base/memory/scoped_ptr.h" | 
|  | #include "base/metrics/bucket_ranges.h" | 
|  | #include "base/metrics/histogram_base.h" | 
|  | // TODO(asvitkine): Migrate callers to include this directly and remove this. | 
|  | #include "base/metrics/histogram_macros.h" | 
|  | #include "base/metrics/histogram_samples.h" | 
|  | #include "base/time/time.h" | 
|  |  | 
|  | namespace base { | 
|  |  | 
|  | class BooleanHistogram; | 
|  | class CustomHistogram; | 
|  | class Histogram; | 
|  | class LinearHistogram; | 
|  | class Pickle; | 
|  | class PickleIterator; | 
|  | class SampleVector; | 
|  |  | 
|  | class BASE_EXPORT Histogram : public HistogramBase { | 
|  | public: | 
|  | // Upper bound on the number of buckets in a histogram; documented as 16,384 (the value is defined out of line). | 
|  | static const size_t kBucketCount_MAX; | 
|  |  | 
|  | typedef std::vector<Count> Counts; | 
|  |  | 
|  | //---------------------------------------------------------------------------- | 
|  | // For a valid histogram, input should follow these restrictions: | 
|  | // minimum > 0 (if a minimum below 1 is specified, it will implicitly be | 
|  | //              normalized up to 1) | 
|  | // maximum > minimum | 
|  | // buckets > 2 [minimum buckets needed: underflow, overflow and the range] | 
|  | // Additionally, | 
|  | // buckets <= (maximum - minimum + 2) - this is to ensure that we don't have | 
|  | // more buckets than the range of numbers; having more buckets than 1 per | 
|  | // value in the range would be nonsensical. | 
|  | static HistogramBase* FactoryGet(const std::string& name, | 
|  | Sample minimum, | 
|  | Sample maximum, | 
|  | size_t bucket_count, | 
|  | int32 flags); | 
|  | static HistogramBase* FactoryTimeGet(const std::string& name, | 
|  | base::TimeDelta minimum, | 
|  | base::TimeDelta maximum, | 
|  | size_t bucket_count, | 
|  | int32 flags); | 
|  |  | 
|  | static void InitializeBucketRanges(Sample minimum, | 
|  | Sample maximum, | 
|  | BucketRanges* ranges); | 
|  |  | 
|  | // This constant is for FindCorruption. Since snapshots of histograms are | 
|  | // taken asynchronously relative to sampling, and our counting code currently | 
|  | // does not prevent race conditions, it is pretty likely that we'll catch a | 
|  | // redundant count that doesn't match the sample count.  We allow for a | 
|  | // certain amount of slop before flagging this as an inconsistency. Even with | 
|  | // an inconsistency, we'll snapshot it again (for UMA in about a half hour), | 
|  | // so we'll eventually get the data, if it was not the result of a corruption. | 
|  | static const int kCommonRaceBasedCountMismatch; | 
|  |  | 
|  | // Check to see if bucket ranges, counts and tallies in the snapshot are | 
|  | // consistent with the bucket ranges and checksums in our histogram.  This can | 
|  | // produce a false-alarm if a race occurred in the reading of the data during | 
|  | // a SnapShot process, but should otherwise be false at all times (unless we | 
|  | // have memory over-writes, or DRAM failures). | 
|  | int FindCorruption(const HistogramSamples& samples) const override; | 
|  |  | 
|  | //---------------------------------------------------------------------------- | 
|  | // Accessors for factory construction, serialization and testing. | 
|  | //---------------------------------------------------------------------------- | 
|  | Sample declared_min() const { return declared_min_; } | 
|  | Sample declared_max() const { return declared_max_; } | 
|  | virtual Sample ranges(size_t i) const; | 
|  | virtual size_t bucket_count() const; | 
|  | const BucketRanges* bucket_ranges() const { return bucket_ranges_; } | 
|  |  | 
|  | // This function validates histogram construction arguments. It returns false | 
|  | // if some of the arguments are totally bad. | 
|  | // Note: Currently it allows some bad input, e.g. 0 as minimum, but silently | 
|  | // converts it to good input: 1 (hence the arguments are passed by pointer). | 
|  | // TODO(kaiwang): Be stricter and return false for any bad input, and | 
|  | // make this a readonly validating function. | 
|  | static bool InspectConstructionArguments(const std::string& name, | 
|  | Sample* minimum, | 
|  | Sample* maximum, | 
|  | size_t* bucket_count); | 
|  |  | 
|  | // HistogramBase implementation: | 
|  | HistogramType GetHistogramType() const override; | 
|  | bool HasConstructionArguments(Sample expected_minimum, | 
|  | Sample expected_maximum, | 
|  | size_t expected_bucket_count) const override; | 
|  | void Add(Sample value) override; | 
|  | scoped_ptr<HistogramSamples> SnapshotSamples() const override; | 
|  | void AddSamples(const HistogramSamples& samples) override; | 
|  | bool AddSamplesFromPickle(base::PickleIterator* iter) override; | 
|  | void WriteHTMLGraph(std::string* output) const override; | 
|  | void WriteAscii(std::string* output) const override; | 
|  |  | 
|  | protected: | 
|  | // |ranges| should contain the underflow and overflow buckets. See top | 
|  | // comments for example. | 
|  | Histogram(const std::string& name, | 
|  | Sample minimum, | 
|  | Sample maximum, | 
|  | const BucketRanges* ranges); | 
|  |  | 
|  | ~Histogram() override; | 
|  |  | 
|  | // HistogramBase implementation: | 
|  | bool SerializeInfoImpl(base::Pickle* pickle) const override; | 
|  |  | 
|  | // Method to override to skip the display of the i'th bucket if it's empty. | 
|  | virtual bool PrintEmptyBucket(size_t index) const; | 
|  |  | 
|  | // Get normalized size, relative to the ranges(i). | 
|  | virtual double GetBucketSize(Count current, size_t i) const; | 
|  |  | 
|  | // Return a string description of what goes in a given bucket. | 
|  | // Most commonly this is the numeric value, but in derived classes it may | 
|  | // be a name (or string description) given to the bucket. | 
|  | virtual const std::string GetAsciiBucketRange(size_t it) const; | 
|  |  | 
|  | private: | 
|  | // Allow tests to corrupt our innards for testing purposes. | 
|  | FRIEND_TEST_ALL_PREFIXES(HistogramTest, BoundsTest); | 
|  | FRIEND_TEST_ALL_PREFIXES(HistogramTest, BucketPlacementTest); | 
|  | FRIEND_TEST_ALL_PREFIXES(HistogramTest, CorruptBucketBounds); | 
|  | FRIEND_TEST_ALL_PREFIXES(HistogramTest, CorruptSampleCounts); | 
|  | FRIEND_TEST_ALL_PREFIXES(HistogramTest, NameMatchTest); | 
|  |  | 
|  | friend class StatisticsRecorder;  // To allow it to delete duplicates. | 
|  | friend class StatisticsRecorderTest; | 
|  |  | 
|  | friend BASE_EXPORT_PRIVATE HistogramBase* DeserializeHistogramInfo( | 
|  | base::PickleIterator* iter); | 
|  | static HistogramBase* DeserializeInfoImpl(base::PickleIterator* iter); | 
|  |  | 
|  | // Implementation of the SnapshotSamples function, returning the concrete SampleVector type. | 
|  | scoped_ptr<SampleVector> SnapshotSampleVector() const; | 
|  |  | 
|  | //---------------------------------------------------------------------------- | 
|  | // Helpers for emitting Ascii graphic.  Each method appends data to output. | 
|  |  | 
|  | void WriteAsciiImpl(bool graph_it, | 
|  | const std::string& newline, | 
|  | std::string* output) const; | 
|  |  | 
|  | // Find out how large (graphically) the largest bucket will appear to be. | 
|  | double GetPeakBucketSize(const SampleVector& samples) const; | 
|  |  | 
|  | // Write a common header message describing this histogram. | 
|  | void WriteAsciiHeader(const SampleVector& samples, | 
|  | Count sample_count, | 
|  | std::string* output) const; | 
|  |  | 
|  | // Write information about previous, current, and next buckets. | 
|  | // Information such as cumulative percentage, etc. | 
|  | void WriteAsciiBucketContext(const int64 past, const Count current, | 
|  | const int64 remaining, const size_t i, | 
|  | std::string* output) const; | 
|  |  | 
|  | // WriteJSON calls these. | 
|  | void GetParameters(DictionaryValue* params) const override; | 
|  |  | 
|  | void GetCountAndBucketData(Count* count, | 
|  | int64* sum, | 
|  | ListValue* buckets) const override; | 
|  |  | 
|  | // Not owned by this histogram. Should be obtained from StatisticsRecorder. | 
|  | const BucketRanges* bucket_ranges_; | 
|  |  | 
|  | Sample declared_min_;  // Less than this goes into the first bucket. | 
|  | Sample declared_max_;  // Over this goes into the last bucket. | 
|  |  | 
|  | // Finally, provide the state that changes with the addition of each new | 
|  | // sample. | 
|  | scoped_ptr<SampleVector> samples_; | 
|  |  | 
|  | DISALLOW_COPY_AND_ASSIGN(Histogram); | 
|  | }; | 
|  |  | 
|  | //------------------------------------------------------------------------------ | 
|  |  | 
|  | // LinearHistogram is a more traditional histogram, with evenly spaced | 
|  | // buckets. | 
|  | class BASE_EXPORT LinearHistogram : public Histogram { | 
|  | public: | 
|  | ~LinearHistogram() override; | 
|  |  | 
|  | /* minimum should start from 1; 0 as a minimum is invalid. 0 is an implicit | 
|  | default underflow bucket. */ | 
|  | static HistogramBase* FactoryGet(const std::string& name, | 
|  | Sample minimum, | 
|  | Sample maximum, | 
|  | size_t bucket_count, | 
|  | int32 flags); | 
|  | static HistogramBase* FactoryTimeGet(const std::string& name, | 
|  | TimeDelta minimum, | 
|  | TimeDelta maximum, | 
|  | size_t bucket_count, | 
|  | int32 flags); | 
|  |  | 
|  | struct DescriptionPair { | 
|  | Sample sample; | 
|  | const char* description;  // Null means end of a list of pairs. | 
|  | }; | 
|  |  | 
|  | // Create a LinearHistogram and store a list of number/text values for use in | 
|  | // writing the histogram graph. | 
|  | // |descriptions| can be NULL, which means no special descriptions to set. If | 
|  | // it's not NULL, the last element in the array must have a NULL in its | 
|  | // "description" field. | 
|  | static HistogramBase* FactoryGetWithRangeDescription( | 
|  | const std::string& name, | 
|  | Sample minimum, | 
|  | Sample maximum, | 
|  | size_t bucket_count, | 
|  | int32 flags, | 
|  | const DescriptionPair descriptions[]); | 
|  |  | 
|  | static void InitializeBucketRanges(Sample minimum, | 
|  | Sample maximum, | 
|  | BucketRanges* ranges); | 
|  |  | 
|  | // Overridden from Histogram: | 
|  | HistogramType GetHistogramType() const override; | 
|  |  | 
|  | protected: | 
|  | LinearHistogram(const std::string& name, | 
|  | Sample minimum, | 
|  | Sample maximum, | 
|  | const BucketRanges* ranges); | 
|  |  | 
|  | double GetBucketSize(Count current, size_t i) const override; | 
|  |  | 
|  | // If we have a description for a bucket, then return that.  Otherwise | 
|  | // let the parent class provide a (numeric) description. | 
|  | const std::string GetAsciiBucketRange(size_t i) const override; | 
|  |  | 
|  | // Skip printing of name for numeric range if we have a name (and if this is | 
|  | // an empty bucket). | 
|  | bool PrintEmptyBucket(size_t index) const override; | 
|  |  | 
|  | private: | 
|  | friend BASE_EXPORT_PRIVATE HistogramBase* DeserializeHistogramInfo( | 
|  | base::PickleIterator* iter); | 
|  | static HistogramBase* DeserializeInfoImpl(base::PickleIterator* iter); | 
|  |  | 
|  | // For some ranges, we store a printable description of a bucket range. | 
|  | // If there is no description, then GetAsciiBucketRange() uses the parent class | 
|  | // to provide a description. | 
|  | typedef std::map<Sample, std::string> BucketDescriptionMap; | 
|  | BucketDescriptionMap bucket_description_; | 
|  |  | 
|  | DISALLOW_COPY_AND_ASSIGN(LinearHistogram); | 
|  | }; | 
|  |  | 
|  | //------------------------------------------------------------------------------ | 
|  |  | 
|  | // BooleanHistogram is a LinearHistogram for booleans; its factory takes only a name and flags. | 
|  | class BASE_EXPORT BooleanHistogram : public LinearHistogram { | 
|  | public: | 
|  | static HistogramBase* FactoryGet(const std::string& name, int32 flags); | 
|  |  | 
|  | HistogramType GetHistogramType() const override; | 
|  |  | 
|  | private: | 
|  | BooleanHistogram(const std::string& name, const BucketRanges* ranges); | 
|  |  | 
|  | friend BASE_EXPORT_PRIVATE HistogramBase* DeserializeHistogramInfo( | 
|  | base::PickleIterator* iter); | 
|  | static HistogramBase* DeserializeInfoImpl(base::PickleIterator* iter); | 
|  |  | 
|  | DISALLOW_COPY_AND_ASSIGN(BooleanHistogram); | 
|  | }; | 
|  |  | 
|  | //------------------------------------------------------------------------------ | 
|  |  | 
|  | // CustomHistogram is a histogram whose range limits are a caller-supplied set of custom integers. | 
|  | class BASE_EXPORT CustomHistogram : public Histogram { | 
|  | public: | 
|  | // |custom_ranges| contains a vector of limits on ranges. Each limit should be | 
|  | // > 0 and < kSampleType_MAX. (Currently 0 is still accepted for backward | 
|  | // compatibility). The limits can be unordered or contain duplicates, but | 
|  | // clients should not depend on this. | 
|  | static HistogramBase* FactoryGet(const std::string& name, | 
|  | const std::vector<Sample>& custom_ranges, | 
|  | int32 flags); | 
|  |  | 
|  | // Overridden from Histogram: | 
|  | HistogramType GetHistogramType() const override; | 
|  |  | 
|  | // Helper method for transforming an array of valid enumeration values | 
|  | // to the std::vector<int> expected by UMA_HISTOGRAM_CUSTOM_ENUMERATION. | 
|  | // This function ensures that a guard bucket exists right after any | 
|  | // valid sample value (unless the next higher sample is also a valid value), | 
|  | // so that invalid samples never fall into the same bucket as valid samples. | 
|  | // TODO(kaiwang): Change name to ArrayToCustomEnumRanges. | 
|  | static std::vector<Sample> ArrayToCustomRanges(const Sample* values, | 
|  | size_t num_values); | 
|  | protected: | 
|  | CustomHistogram(const std::string& name, | 
|  | const BucketRanges* ranges); | 
|  |  | 
|  | // HistogramBase implementation: | 
|  | bool SerializeInfoImpl(base::Pickle* pickle) const override; | 
|  |  | 
|  | double GetBucketSize(Count current, size_t i) const override; | 
|  |  | 
|  | private: | 
|  | friend BASE_EXPORT_PRIVATE HistogramBase* DeserializeHistogramInfo( | 
|  | base::PickleIterator* iter); | 
|  | static HistogramBase* DeserializeInfoImpl(base::PickleIterator* iter); | 
|  |  | 
|  | static bool ValidateCustomRanges(const std::vector<Sample>& custom_ranges); | 
|  | static BucketRanges* CreateBucketRangesFromCustomRanges( | 
|  | const std::vector<Sample>& custom_ranges); | 
|  |  | 
|  | DISALLOW_COPY_AND_ASSIGN(CustomHistogram); | 
|  | }; | 
|  |  | 
|  | }  // namespace base | 
|  |  | 
|  | #endif  // BASE_METRICS_HISTOGRAM_H_ |