• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4 
5 // Histogram is an object that aggregates statistics, and can summarize them in
6 // various forms, including ASCII graphical, HTML, and numerically (as a
7 // vector of numbers corresponding to each of the aggregating buckets).
8 
9 // It supports calls to accumulate either time intervals (which are processed
10 // as integral number of milliseconds), or arbitrary integral units.
11 
12 // For Histogram(exponential histogram), LinearHistogram and CustomHistogram,
13 // the minimum for a declared range is 1 (instead of 0), while the maximum is
14 // (HistogramBase::kSampleType_MAX - 1). Currently you can declare histograms
15 // with ranges exceeding those limits (e.g. 0 as minimal or
16 // HistogramBase::kSampleType_MAX as maximal), but those excesses will be
17 // silently clamped to those limits (for backwards compatibility with existing
18 // code). Best practice is to not exceed the limits.
19 
20 // Each use of a histogram with the same name will reference the same underlying
21 // data, so it is safe to record to the same histogram from multiple locations
22 // in the code. It is a runtime error if all uses of the same histogram do not
23 // agree exactly in type, bucket size and range.
24 
25 // For Histogram and LinearHistogram, the maximum for a declared range should
26 // always be strictly larger than the minimum.  Zero and
27 // HistogramBase::kSampleType_MAX are implicitly added as first and last ranges,
28 // so the smallest legal bucket_count is 3. However CustomHistogram can have
29 // bucket count as 2 (when you give a custom ranges vector containing only 1
30 // range).
31 // For these 3 kinds of histograms, the max bucket count is always
32 // (Histogram::kBucketCount_MAX - 1).
33 
34 // The buckets layout of class Histogram is exponential. For example, buckets
35 // might contain (sequentially) the count of values in the following intervals:
36 // [0,1), [1,2), [2,4), [4,8), [8,16), [16,32), [32,64), [64,infinity)
37 // That bucket allocation would actually result from construction of a histogram
38 // for values between 1 and 64, with 8 buckets, such as:
39 // Histogram count("some name", 1, 64, 8);
40 // Note that the underflow bucket [0,1) and the overflow bucket [64,infinity)
41 // are also counted by the constructor in the user supplied "bucket_count"
42 // argument.
43 // The above example has an exponential ratio of 2 (doubling the bucket width
44 // in each consecutive bucket).  The Histogram class automatically calculates
45 // the smallest ratio that it can use to construct the number of buckets
46 // selected in the constructor.  As another example, if you had 50 buckets,
47 // and millisecond time values from 1 to 10000, then the ratio between
48 // consecutive bucket widths will be approximately somewhere around the 50th
49 // root of 10000.  This approach provides very fine grain (narrow) buckets
50 // at the low end of the histogram scale, but allows the histogram to cover a
51 // gigantic range with the addition of very few buckets.
52 
53 // Usually we use macros to define and use a histogram. These macros use a
54 // pattern involving a function static variable, that is a pointer to a
55 // histogram.  This static is explicitly initialized on any thread
56 // that detects an uninitialized (NULL) pointer.  The potentially racy
57 // initialization is not a problem as it is always set to point to the same
58 // value (i.e., the FactoryGet always returns the same value).  FactoryGet
59 // is also completely thread safe, which results in a completely thread safe,
60 // and relatively fast, set of counters.  To avoid races at shutdown, the static
61 // pointer is NOT deleted, and we leak the histograms at process termination.
62 
63 #ifndef BASE_METRICS_HISTOGRAM_H_
64 #define BASE_METRICS_HISTOGRAM_H_
65 
66 #include <map>
67 #include <string>
68 #include <vector>
69 
70 #include "base/atomicops.h"
71 #include "base/base_export.h"
72 #include "base/basictypes.h"
73 #include "base/compiler_specific.h"
74 #include "base/gtest_prod_util.h"
75 #include "base/logging.h"
76 #include "base/memory/scoped_ptr.h"
77 #include "base/metrics/bucket_ranges.h"
78 #include "base/metrics/histogram_base.h"
79 #include "base/metrics/histogram_samples.h"
80 #include "base/time/time.h"
81 
82 class Pickle;
83 class PickleIterator;
84 
85 namespace base {
86 
87 class Lock;
88 //------------------------------------------------------------------------------
89 // Histograms are often put in areas where they are called many many times, and
90 // performance is critical.  As a result, they are designed to have a very low
91 // recurring cost of executing (adding additional samples).  Toward that end,
92 // the macros declare a static pointer to the histogram in question, and only
93 // take a "slow path" to construct (or find) the histogram on the first run
94 // through the macro.  We leak the histograms at shutdown time so that we don't
95 // have to validate using the pointers at any time during the running of the
96 // process.
97 
98 // The following code is generally what a thread-safe static pointer
99 // initialization looks like for a histogram (after a macro is expanded).  This
100 // sample is an expansion (with comments) of the code for
101 // HISTOGRAM_CUSTOM_COUNTS().
102 
103 /*
104   do {
105     // The pointer's presence indicates the initialization is complete.
106     // Initialization is idempotent, so it can safely be atomically repeated.
107     static base::subtle::AtomicWord atomic_histogram_pointer = 0;
108 
109     // Acquire_Load() ensures that we acquire visibility to the pointed-to data
110     // in the histogram.
111     base::Histogram* histogram_pointer(reinterpret_cast<base::Histogram*>(
112         base::subtle::Acquire_Load(&atomic_histogram_pointer)));
113 
114     if (!histogram_pointer) {
115       // This is the slow path, which will construct OR find the matching
116       // histogram.  FactoryGet includes locks on a global histogram name map
117       // and is completely thread safe.
118       histogram_pointer = base::Histogram::FactoryGet(
119           name, min, max, bucket_count, base::HistogramBase::kNoFlags);
120 
121       // Use Release_Store to ensure that the histogram data is made available
122       // globally before we make the pointer visible.
123       // Several threads may perform this store, but the same value will be
124       // stored in all cases (for a given named/spec'ed histogram).
125       // We could do this without any barrier, since FactoryGet entered and
126       // exited a lock after construction, but this barrier makes things clear.
127       base::subtle::Release_Store(&atomic_histogram_pointer,
128           reinterpret_cast<base::subtle::AtomicWord>(histogram_pointer));
129     }
130 
131     // Ensure calling contract is upheld, and the name does NOT vary.
132     DCHECK(histogram_pointer->histogram_name() == constant_histogram_name);
133 
134     histogram_pointer->Add(sample);
135   } while (0);
136 */
137 
// Shared body of the histogram recording macros in this file.  It follows the
// commented expansion shown above; only three pieces vary per macro and are
// therefore passed in as arguments:
//   constant_histogram_name          - handed to CheckName() when DCHECK_IS_ON
//                                      is true, to assure that callers don't
//                                      try to vary the name of the histogram
//                                      (which would tend to be ignored by the
//                                      one-time initialization of the
//                                      histogram_pointer).
//   histogram_add_method_invocation  - the member call made on the histogram,
//                                      e.g. Add(sample) or AddTime(sample).
//   histogram_factory_get_invocation - the complete FactoryGet call, with its
//                                      argument list, used on the slow path
//                                      when the cached pointer is still 0.
#define STATIC_HISTOGRAM_POINTER_BLOCK(constant_histogram_name,               \
                                       histogram_add_method_invocation,       \
                                       histogram_factory_get_invocation)      \
  do {                                                                        \
    static base::subtle::AtomicWord atomic_histogram_pointer = 0;             \
    base::HistogramBase* histogram_pointer =                                  \
        reinterpret_cast<base::HistogramBase*>(                               \
            base::subtle::Acquire_Load(&atomic_histogram_pointer));           \
    if (!histogram_pointer) {                                                 \
      histogram_pointer = histogram_factory_get_invocation;                   \
      base::subtle::Release_Store(                                            \
          &atomic_histogram_pointer,                                          \
          reinterpret_cast<base::subtle::AtomicWord>(histogram_pointer));     \
    }                                                                         \
    if (DCHECK_IS_ON) {                                                       \
      histogram_pointer->CheckName(constant_histogram_name);                  \
    }                                                                         \
    histogram_pointer->histogram_add_method_invocation;                       \
  } while (0)
162 
163 
//------------------------------------------------------------------------------
// General purpose histogram macros, usable much like stats counters.  The two
// CUSTOM macros take an explicit range and bucket count; every other macro in
// this group forwards to one of them with 50 buckets.

// For folks that need real specific times: selects the precise range of times
// to plot and the number of buckets to use.  |sample| is passed to AddTime().
#define HISTOGRAM_CUSTOM_TIMES(name, sample, min, max, bucket_count)          \
  STATIC_HISTOGRAM_POINTER_BLOCK(                                             \
      name, AddTime(sample),                                                  \
      base::Histogram::FactoryTimeGet(name, min, max, bucket_count,           \
                                      base::HistogramBase::kNoFlags))

// Counterpart of HISTOGRAM_CUSTOM_TIMES for plain integral samples; |sample|
// is passed to Add().
#define HISTOGRAM_CUSTOM_COUNTS(name, sample, min, max, bucket_count)         \
  STATIC_HISTOGRAM_POINTER_BLOCK(                                             \
      name, Add(sample),                                                      \
      base::Histogram::FactoryGet(name, min, max, bucket_count,               \
                                  base::HistogramBase::kNoFlags))

// Times between 1 millisecond and 10 seconds.
#define HISTOGRAM_TIMES(name, sample)                                         \
  HISTOGRAM_CUSTOM_TIMES(name, sample,                                        \
                         base::TimeDelta::FromMilliseconds(1),                \
                         base::TimeDelta::FromSeconds(10), 50)

// Counts with a declared range of 1 to 1000000.
#define HISTOGRAM_COUNTS(name, sample)                                        \
  HISTOGRAM_CUSTOM_COUNTS(name, sample, 1, 1000000, 50)

// Counts with a declared range of 1 to 100.
#define HISTOGRAM_COUNTS_100(name, sample)                                    \
  HISTOGRAM_CUSTOM_COUNTS(name, sample, 1, 100, 50)

// Counts with a declared range of 1 to 10000.
#define HISTOGRAM_COUNTS_10000(name, sample)                                  \
  HISTOGRAM_CUSTOM_COUNTS(name, sample, 1, 10000, 50)
192 
// This is a helper macro used by other macros and shouldn't be used directly.
// |boundary| is wrapped in parentheses where 1 is added to it, so that an
// argument written with lower-precedence operators (for example `1 << 3` or
// `a ? b : c`) still produces a bucket count of boundary + 1.
#define HISTOGRAM_ENUMERATION_WITH_FLAG(name, sample, boundary, flag) \
    STATIC_HISTOGRAM_POINTER_BLOCK(name, Add(sample), \
        base::LinearHistogram::FactoryGet(name, 1, boundary, (boundary) + 1, \
            flag))

// Percentage histogram: an enumeration with a boundary value of 101.
#define HISTOGRAM_PERCENTAGE(name, under_one_hundred) \
    HISTOGRAM_ENUMERATION(name, under_one_hundred, 101)

// Records |sample| through AddBoolean() on the histogram returned by
// base::BooleanHistogram::FactoryGet().  The flag is spelled through
// HistogramBase, like every other macro in this file.
#define HISTOGRAM_BOOLEAN(name, sample) \
    STATIC_HISTOGRAM_POINTER_BLOCK(name, AddBoolean(sample), \
        base::BooleanHistogram::FactoryGet(name, \
                                           base::HistogramBase::kNoFlags))

// Support histograming of an enumerated value.  The samples should always be
// strictly less than |boundary_value| -- this prevents you from running into
// problems down the line if you add additional buckets to the histogram.  Note
// also that, despite explicitly setting the minimum bucket value to |1| below,
// it is fine for enumerated histograms to be 0-indexed -- this is because
// enumerated histograms should never have underflow.
// |boundary_value| is parenthesized before 1 is added, for the same operator
// precedence reason as in HISTOGRAM_ENUMERATION_WITH_FLAG.
#define HISTOGRAM_ENUMERATION(name, sample, boundary_value) \
    STATIC_HISTOGRAM_POINTER_BLOCK(name, Add(sample), \
        base::LinearHistogram::FactoryGet(name, 1, boundary_value, \
            (boundary_value) + 1, base::HistogramBase::kNoFlags))

// Support histograming of an enumerated value. Samples should be one of the
// std::vector<int> list provided via |custom_ranges|. See comments above
// CustomHistogram::FactoryGet about the requirement of |custom_ranges|.
// You can use the helper function CustomHistogram::ArrayToCustomRanges to
// transform a C-style array of valid sample values to a std::vector<int>.
#define HISTOGRAM_CUSTOM_ENUMERATION(name, sample, custom_ranges) \
    STATIC_HISTOGRAM_POINTER_BLOCK(name, Add(sample), \
        base::CustomHistogram::FactoryGet(name, custom_ranges, \
                                          base::HistogramBase::kNoFlags))

// Counts with a declared range of 1000 to 500000 and 50 buckets.
#define HISTOGRAM_MEMORY_KB(name, sample) HISTOGRAM_CUSTOM_COUNTS( \
    name, sample, 1000, 500000, 50)
229 
230 //------------------------------------------------------------------------------
231 // Define Debug vs non-debug flavors of macros.
232 #ifndef NDEBUG
233 
// Debug flavor (this branch is compiled when NDEBUG is not defined): every
// DHISTOGRAM_* macro forwards its arguments unchanged to a HISTOGRAM_* macro.
#define DHISTOGRAM_TIMES(name, sample) HISTOGRAM_TIMES(name, sample)
#define DHISTOGRAM_COUNTS(name, sample) HISTOGRAM_COUNTS(name, sample)
#define DHISTOGRAM_PERCENTAGE(name, under_one_hundred) HISTOGRAM_PERCENTAGE(\
    name, under_one_hundred)
#define DHISTOGRAM_CUSTOM_TIMES(name, sample, min, max, bucket_count) \
    HISTOGRAM_CUSTOM_TIMES(name, sample, min, max, bucket_count)
// HISTOGRAM_CLIPPED_TIMES is not defined anywhere in this header, so the
// clipped variant forwards to HISTOGRAM_CUSTOM_TIMES, which accepts the same
// argument list.
// NOTE(review): with this forwarding, samples at or above |max| are recorded
// like any other sample -- confirm that no caller relies on them being
// dropped, and that no other header was meant to supply
// HISTOGRAM_CLIPPED_TIMES.
#define DHISTOGRAM_CLIPPED_TIMES(name, sample, min, max, bucket_count) \
    HISTOGRAM_CUSTOM_TIMES(name, sample, min, max, bucket_count)
#define DHISTOGRAM_CUSTOM_COUNTS(name, sample, min, max, bucket_count) \
    HISTOGRAM_CUSTOM_COUNTS(name, sample, min, max, bucket_count)
#define DHISTOGRAM_ENUMERATION(name, sample, boundary_value) \
    HISTOGRAM_ENUMERATION(name, sample, boundary_value)
#define DHISTOGRAM_CUSTOM_ENUMERATION(name, sample, custom_ranges) \
    HISTOGRAM_CUSTOM_ENUMERATION(name, sample, custom_ranges)
248 
249 #else  // NDEBUG
// Keep a mention of passed variables to avoid unused variable warnings in
// release build if these variables are only used in macros.
// The arguments are only named inside a branch that is never taken, so they
// are never evaluated.  Each macro is wrapped in do { ... } while (0) so that
// an invocation followed by a semicolon is exactly one statement and can be
// used as the body of an unbraced if/else.
#define DISCARD_2_ARGUMENTS(a, b) \
  do { \
    if (false) { \
      static_cast<void>(a); \
      static_cast<void>(b); \
    } \
  } while (0)
#define DISCARD_3_ARGUMENTS(a, b, c) \
  do { \
    if (false) { \
      static_cast<void>(a); \
      static_cast<void>(b); \
      static_cast<void>(c); \
    } \
  } while (0)
#define DISCARD_5_ARGUMENTS(a, b, c, d, e) \
  do { \
    if (false) { \
      static_cast<void>(a); \
      static_cast<void>(b); \
      static_cast<void>(c); \
      static_cast<void>(d); \
      static_cast<void>(e); \
    } \
  } while (0)
// Release flavor: nothing is recorded.  Each DHISTOGRAM_* macro only hands its
// arguments to the DISCARD_*_ARGUMENTS macro of matching arity.

// Two-argument forms.
#define DHISTOGRAM_TIMES(name, sample) DISCARD_2_ARGUMENTS(name, sample)
#define DHISTOGRAM_COUNTS(name, sample) DISCARD_2_ARGUMENTS(name, sample)
#define DHISTOGRAM_PERCENTAGE(name, under_one_hundred)                        \
  DISCARD_2_ARGUMENTS(name, under_one_hundred)

// Three-argument forms.
#define DHISTOGRAM_ENUMERATION(name, sample, boundary_value)                  \
  DISCARD_3_ARGUMENTS(name, sample, boundary_value)
#define DHISTOGRAM_CUSTOM_ENUMERATION(name, sample, custom_ranges)            \
  DISCARD_3_ARGUMENTS(name, sample, custom_ranges)

// Five-argument forms.
#define DHISTOGRAM_CUSTOM_TIMES(name, sample, min, max, bucket_count)         \
  DISCARD_5_ARGUMENTS(name, sample, min, max, bucket_count)
#define DHISTOGRAM_CLIPPED_TIMES(name, sample, min, max, bucket_count)        \
  DISCARD_5_ARGUMENTS(name, sample, min, max, bucket_count)
#define DHISTOGRAM_CUSTOM_COUNTS(name, sample, min, max, bucket_count)        \
  DISCARD_5_ARGUMENTS(name, sample, min, max, bucket_count)
294 
295 #endif  // NDEBUG
296 
//------------------------------------------------------------------------------
// UMA flavors of the recording macros: typical usage for callers that wish to
// record histogram data and have it submitted/uploaded via UMA.  Not all
// systems support such UMA, but if they do, the following macros should work
// with the service.  Every histogram created by the macros in this group
// carries base::HistogramBase::kUmaTargetedHistogramFlag.

// Explicit range and bucket count for time samples (passed to AddTime()).
#define UMA_HISTOGRAM_CUSTOM_TIMES(name, sample, min, max, bucket_count)      \
  STATIC_HISTOGRAM_POINTER_BLOCK(                                             \
      name, AddTime(sample),                                                  \
      base::Histogram::FactoryTimeGet(                                        \
          name, min, max, bucket_count,                                       \
          base::HistogramBase::kUmaTargetedHistogramFlag))

// Explicit range and bucket count for integral samples (passed to Add()).
#define UMA_HISTOGRAM_CUSTOM_COUNTS(name, sample, min, max, bucket_count)     \
  STATIC_HISTOGRAM_POINTER_BLOCK(                                             \
      name, Add(sample),                                                      \
      base::Histogram::FactoryGet(                                            \
          name, min, max, bucket_count,                                       \
          base::HistogramBase::kUmaTargetedHistogramFlag))

// Times between 1 millisecond and 10 seconds, 50 buckets.
#define UMA_HISTOGRAM_TIMES(name, sample)                                     \
  UMA_HISTOGRAM_CUSTOM_TIMES(name, sample,                                    \
                             base::TimeDelta::FromMilliseconds(1),            \
                             base::TimeDelta::FromSeconds(10), 50)

// Times between 10 milliseconds and 3 minutes, 50 buckets.
#define UMA_HISTOGRAM_MEDIUM_TIMES(name, sample)                              \
  UMA_HISTOGRAM_CUSTOM_TIMES(name, sample,                                    \
                             base::TimeDelta::FromMilliseconds(10),           \
                             base::TimeDelta::FromMinutes(3), 50)

// Use this macro when times can routinely be much longer than 10 seconds.
#define UMA_HISTOGRAM_LONG_TIMES(name, sample)                                \
  UMA_HISTOGRAM_CUSTOM_TIMES(name, sample,                                    \
                             base::TimeDelta::FromMilliseconds(1),            \
                             base::TimeDelta::FromHours(1), 50)

// Use this macro when times can routinely be much longer than 10 seconds and
// you want 100 buckets.
#define UMA_HISTOGRAM_LONG_TIMES_100(name, sample)                            \
  UMA_HISTOGRAM_CUSTOM_TIMES(name, sample,                                    \
                             base::TimeDelta::FromMilliseconds(1),            \
                             base::TimeDelta::FromHours(1), 100)

// Counts with a declared range of 1 to 1000000, 50 buckets.
#define UMA_HISTOGRAM_COUNTS(name, sample)                                    \
  UMA_HISTOGRAM_CUSTOM_COUNTS(name, sample, 1, 1000000, 50)

// Counts with a declared range of 1 to 100, 50 buckets.
#define UMA_HISTOGRAM_COUNTS_100(name, sample)                                \
  UMA_HISTOGRAM_CUSTOM_COUNTS(name, sample, 1, 100, 50)

// Counts with a declared range of 1 to 10000, 50 buckets.
#define UMA_HISTOGRAM_COUNTS_10000(name, sample)                              \
  UMA_HISTOGRAM_CUSTOM_COUNTS(name, sample, 1, 10000, 50)

// Counts with a declared range of 1000 to 500000, 50 buckets.
#define UMA_HISTOGRAM_MEMORY_KB(name, sample)                                 \
  UMA_HISTOGRAM_CUSTOM_COUNTS(name, sample, 1000, 500000, 50)

// Counts with a declared range of 1 to 1000, 50 buckets.
#define UMA_HISTOGRAM_MEMORY_MB(name, sample)                                 \
  UMA_HISTOGRAM_CUSTOM_COUNTS(name, sample, 1, 1000, 50)
346 
// The samples should always be strictly less than |boundary_value|.  For more
// details, see the comment for the |HISTOGRAM_ENUMERATION| macro, above.
#define UMA_HISTOGRAM_ENUMERATION(name, sample, boundary_value)               \
  HISTOGRAM_ENUMERATION_WITH_FLAG(                                            \
      name, sample, boundary_value,                                           \
      base::HistogramBase::kUmaTargetedHistogramFlag)

// Similar to UMA_HISTOGRAM_ENUMERATION, but used for recording stability
// histograms.  Use this if recording a histogram that should be part of the
// initial stability log.
#define UMA_STABILITY_HISTOGRAM_ENUMERATION(name, sample, boundary_value)     \
  HISTOGRAM_ENUMERATION_WITH_FLAG(                                            \
      name, sample, boundary_value,                                           \
      base::HistogramBase::kUmaStabilityHistogramFlag)

// Percentage histogram: a UMA enumeration with a boundary value of 101.
#define UMA_HISTOGRAM_PERCENTAGE(name, under_one_hundred)                     \
  UMA_HISTOGRAM_ENUMERATION(name, under_one_hundred, 101)

// Records |sample| through AddBoolean() on a BooleanHistogram created with
// the UMA targeted flag.
#define UMA_HISTOGRAM_BOOLEAN(name, sample)                                   \
  STATIC_HISTOGRAM_POINTER_BLOCK(                                             \
      name, AddBoolean(sample),                                               \
      base::BooleanHistogram::FactoryGet(                                     \
          name, base::HistogramBase::kUmaTargetedHistogramFlag))

// Records |sample| through Add() on a CustomHistogram built from
// |custom_ranges| and created with the UMA targeted flag.
#define UMA_HISTOGRAM_CUSTOM_ENUMERATION(name, sample, custom_ranges)         \
  STATIC_HISTOGRAM_POINTER_BLOCK(                                             \
      name, Add(sample),                                                      \
      base::CustomHistogram::FactoryGet(                                      \
          name, custom_ranges,                                                \
          base::HistogramBase::kUmaTargetedHistogramFlag))
372 
373 //------------------------------------------------------------------------------
374 
// Forward declarations of the types used or defined in the remainder of this
// header.
375 class BucketRanges;
376 class SampleVector;
377 
// The four histogram classes declared below.
378 class BooleanHistogram;
379 class CustomHistogram;
380 class Histogram;
381 class LinearHistogram;
382 
// Histogram whose bucket layout is exponential (see the example in the
// comments at the top of this file).  The constructor and destructor are
// protected; the public way to obtain an instance is through the static
// FactoryGet() / FactoryTimeGet() functions.
383 class BASE_EXPORT Histogram : public HistogramBase {
384  public:
385   // Initialize maximum number of buckets in histograms as 16,384.
386   static const size_t kBucketCount_MAX;
387 
      // A sequence of Count values.
388   typedef std::vector<Count> Counts;
389 
390   //----------------------------------------------------------------------------
391   // For a valid histogram, input should follow these restrictions:
392   // minimum > 0 (if a minimum below 1 is specified, it will implicitly be
393   //              normalized up to 1)
394   // maximum > minimum
395   // buckets > 2 [minimum buckets needed: underflow, overflow and the range]
396   // Additionally,
397   // buckets <= (maximum - minimum + 2) - this is to ensure that we don't have
398   // more buckets than the range of numbers; having more buckets than 1 per
399   // value in the range would be nonsensical.
400   static HistogramBase* FactoryGet(const std::string& name,
401                                    Sample minimum,
402                                    Sample maximum,
403                                    size_t bucket_count,
404                                    int32 flags);
      // Same argument list as FactoryGet(), except that the range is given as
      // base::TimeDelta values.
405   static HistogramBase* FactoryTimeGet(const std::string& name,
406                                        base::TimeDelta minimum,
407                                        base::TimeDelta maximum,
408                                        size_t bucket_count,
409                                        int32 flags);
410 
411   // Time call for use with DHISTOGRAM*.
412   // Returns TimeTicks::Now() in debug and TimeTicks() in release build.
413   static TimeTicks DebugNow();
414 
      // NOTE(review): presumably fills |ranges| with the exponential bucket
      // boundaries for [minimum, maximum] -- confirm against the .cc file.
415   static void InitializeBucketRanges(Sample minimum,
416                                      Sample maximum,
417                                      BucketRanges* ranges);
418 
419   // This constant is for FindCorruption. Since snapshots of histograms are
420   // taken asynchronously relative to sampling, and our counting code currently
421   // does not prevent race conditions, it is pretty likely that we'll catch a
422   // redundant count that doesn't match the sample count.  We allow for a
423   // certain amount of slop before flagging this as an inconsistency. Even with
424   // an inconsistency, we'll snapshot it again (for UMA in about a half hour),
425   // so we'll eventually get the data, if it was not the result of a corruption.
426   static const int kCommonRaceBasedCountMismatch;
427 
428   // Check to see if bucket ranges, counts and tallies in the snapshot are
429   // consistent with the bucket ranges and checksums in our histogram.  This can
430   // produce a false-alarm if a race occurred in the reading of the data during
431   // a SnapShot process, but should otherwise be false at all times (unless we
432   // have memory over-writes, or DRAM failures).
433   virtual int FindCorruption(const HistogramSamples& samples) const OVERRIDE;
434 
435   //----------------------------------------------------------------------------
436   // Accessors for factory construction, serialization and testing.
437   //----------------------------------------------------------------------------
declared_min()438   Sample declared_min() const { return declared_min_; }
declared_max()439   Sample declared_max() const { return declared_max_; }
440   virtual Sample ranges(size_t i) const;
441   virtual size_t bucket_count() const;
bucket_ranges()442   const BucketRanges* bucket_ranges() const { return bucket_ranges_; }
443 
444   // This function validates histogram construction arguments. It returns false
445   // if some of the arguments are totally bad.
446   // Note. Currently it allows some bad input, e.g. 0 as minimum, but silently
447   // converts it to good input: 1.
448   // TODO(kaiwang): Be more restrictive and return false for any bad input, and
449   // make this a readonly validating function.
450   static bool InspectConstructionArguments(const std::string& name,
451                                            Sample* minimum,
452                                            Sample* maximum,
453                                            size_t* bucket_count);
454 
455   // HistogramBase implementation:
456   virtual HistogramType GetHistogramType() const OVERRIDE;
457   virtual bool HasConstructionArguments(
458       Sample expected_minimum,
459       Sample expected_maximum,
460       size_t expected_bucket_count) const OVERRIDE;
461   virtual void Add(Sample value) OVERRIDE;
462   virtual scoped_ptr<HistogramSamples> SnapshotSamples() const OVERRIDE;
463   virtual void AddSamples(const HistogramSamples& samples) OVERRIDE;
464   virtual bool AddSamplesFromPickle(PickleIterator* iter) OVERRIDE;
465   virtual void WriteHTMLGraph(std::string* output) const OVERRIDE;
466   virtual void WriteAscii(std::string* output) const OVERRIDE;
467 
468  protected:
469   // |ranges| should contain the underflow and overflow buckets. See top
470   // comments for example.
471   Histogram(const std::string& name,
472             Sample minimum,
473             Sample maximum,
474             const BucketRanges* ranges);
475 
476   virtual ~Histogram();
477 
478   // HistogramBase implementation:
479   virtual bool SerializeInfoImpl(Pickle* pickle) const OVERRIDE;
480 
481   // Method to override to skip the display of the i'th bucket if it's empty.
482   virtual bool PrintEmptyBucket(size_t index) const;
483 
484   // Get normalized size, relative to the ranges(i).
485   virtual double GetBucketSize(Count current, size_t i) const;
486 
487   // Return a string description of what goes in a given bucket.
488   // Most commonly this is the numeric value, but in derived classes it may
489   // be a name (or string description) given to the bucket.
490   virtual const std::string GetAsciiBucketRange(size_t it) const;
491 
492  private:
493   // Allow tests to corrupt our innards for testing purposes.
494   FRIEND_TEST_ALL_PREFIXES(HistogramTest, BoundsTest);
495   FRIEND_TEST_ALL_PREFIXES(HistogramTest, BucketPlacementTest);
496   FRIEND_TEST_ALL_PREFIXES(HistogramTest, CorruptBucketBounds);
497   FRIEND_TEST_ALL_PREFIXES(HistogramTest, CorruptSampleCounts);
498   FRIEND_TEST_ALL_PREFIXES(HistogramTest, NameMatchTest);
499 
500   friend class StatisticsRecorder;  // To allow it to delete duplicates.
501   friend class StatisticsRecorderTest;
502 
      // DeserializeHistogramInfo() is a friend so that it can reach the
      // private DeserializeInfoImpl() declared right after it.
503   friend BASE_EXPORT_PRIVATE HistogramBase* DeserializeHistogramInfo(
504       PickleIterator* iter);
505   static HistogramBase* DeserializeInfoImpl(PickleIterator* iter);
506 
507   // Implementation of SnapshotSamples function.
508   scoped_ptr<SampleVector> SnapshotSampleVector() const;
509 
510   //----------------------------------------------------------------------------
511   // Helpers for emitting Ascii graphic.  Each method appends data to output.
512 
513   void WriteAsciiImpl(bool graph_it,
514                       const std::string& newline,
515                       std::string* output) const;
516 
517   // Find out how large (graphically) the largest bucket will appear to be.
518   double GetPeakBucketSize(const SampleVector& samples) const;
519 
520   // Write a common header message describing this histogram.
521   void WriteAsciiHeader(const SampleVector& samples,
522                         Count sample_count,
523                         std::string* output) const;
524 
525   // Write information about previous, current, and next buckets.
526   // Information such as cumulative percentage, etc.
527   void WriteAsciiBucketContext(const int64 past, const Count current,
528                                const int64 remaining, const size_t i,
529                                std::string* output) const;
530 
531   // WriteJSON calls these.
532   virtual void GetParameters(DictionaryValue* params) const OVERRIDE;
533 
534   virtual void GetCountAndBucketData(Count* count,
535                                      int64* sum,
536                                      ListValue* buckets) const OVERRIDE;
537 
538   // Does not own this object. Should get from StatisticsRecorder.
539   const BucketRanges* bucket_ranges_;
540 
541   Sample declared_min_;  // Less than this goes into the first bucket.
542   Sample declared_max_;  // Over this goes into the last bucket.
543 
544   // Finally, provide the state that changes with the addition of each new
545   // sample.
546   scoped_ptr<SampleVector> samples_;
547 
548   DISALLOW_COPY_AND_ASSIGN(Histogram);
549 };
550 
551 //------------------------------------------------------------------------------
552 
553 // LinearHistogram is a more traditional histogram, with evenly spaced
554 // buckets.  It derives from Histogram and can additionally store a textual
      // description per bucket range (see |bucket_description_|).
555 class BASE_EXPORT LinearHistogram : public Histogram {
556  public:
557   virtual ~LinearHistogram();
558 
559   /* minimum should start from 1. 0 as minimum is invalid. 0 is an implicit
560      default underflow bucket. */
561   static HistogramBase* FactoryGet(const std::string& name,
562                                    Sample minimum,
563                                    Sample maximum,
564                                    size_t bucket_count,
565                                    int32 flags);
      // Same argument list as FactoryGet(), except that the range is given as
      // TimeDelta values.
566   static HistogramBase* FactoryTimeGet(const std::string& name,
567                                        TimeDelta minimum,
568                                        TimeDelta maximum,
569                                        size_t bucket_count,
570                                        int32 flags);
571 
      // One entry of the array accepted by FactoryGetWithRangeDescription().
572   struct DescriptionPair {
573     Sample sample;
574     const char* description;  // Null means end of a list of pairs.
575   };
576 
577   // Create a LinearHistogram and store a list of number/text values for use in
578   // writing the histogram graph.
579   // |descriptions| can be NULL, which means no special descriptions to set. If
580   // it's not NULL, the last element in the array must have a NULL in its
581   // "description" field.
582   static HistogramBase* FactoryGetWithRangeDescription(
583       const std::string& name,
584       Sample minimum,
585       Sample maximum,
586       size_t bucket_count,
587       int32 flags,
588       const DescriptionPair descriptions[]);
589 
      // NOTE(review): presumably fills |ranges| with evenly spaced bucket
      // boundaries for [minimum, maximum] -- confirm against the .cc file.
590   static void InitializeBucketRanges(Sample minimum,
591                                      Sample maximum,
592                                      BucketRanges* ranges);
593 
594   // Overridden from Histogram:
595   virtual HistogramType GetHistogramType() const OVERRIDE;
596 
597  protected:
      // Same parameter list as the protected Histogram constructor.
598   LinearHistogram(const std::string& name,
599                   Sample minimum,
600                   Sample maximum,
601                   const BucketRanges* ranges);
602 
603   virtual double GetBucketSize(Count current, size_t i) const OVERRIDE;
604 
605   // If we have a description for a bucket, then return that.  Otherwise
606   // let parent class provide a (numeric) description.
607   virtual const std::string GetAsciiBucketRange(size_t i) const OVERRIDE;
608 
609   // Skip printing of name for numeric range if we have a name (and if this is
610   // an empty bucket).
611   virtual bool PrintEmptyBucket(size_t index) const OVERRIDE;
612 
613  private:
614   friend BASE_EXPORT_PRIVATE HistogramBase* DeserializeHistogramInfo(
615       PickleIterator* iter);
616   static HistogramBase* DeserializeInfoImpl(PickleIterator* iter);
617 
618   // For some ranges, we store a printable description of a bucket range.
619   // If there is no description, then GetAsciiBucketRange() uses parent class
620   // to provide a description.
621   typedef std::map<Sample, std::string> BucketDescriptionMap;
622   BucketDescriptionMap bucket_description_;
623 
624   DISALLOW_COPY_AND_ASSIGN(LinearHistogram);
625 };
626 
627 //------------------------------------------------------------------------------
628 
629 // BooleanHistogram is a histogram for booleans.  It derives from
      // LinearHistogram; its only constructor is private.
630 class BASE_EXPORT BooleanHistogram : public LinearHistogram {
631  public:
      // Unlike the Histogram and LinearHistogram factories, this one takes only
      // a name and flags: no range or bucket count is supplied by the caller.
632   static HistogramBase* FactoryGet(const std::string& name, int32 flags);
633 
      // Overridden from LinearHistogram:
634   virtual HistogramType GetHistogramType() const OVERRIDE;
635 
636  private:
637   BooleanHistogram(const std::string& name, const BucketRanges* ranges);
638 
639   friend BASE_EXPORT_PRIVATE HistogramBase* DeserializeHistogramInfo(
640       PickleIterator* iter);
641   static HistogramBase* DeserializeInfoImpl(PickleIterator* iter);
642 
643   DISALLOW_COPY_AND_ASSIGN(BooleanHistogram);
644 };
645 
646 //------------------------------------------------------------------------------
647 
648 // CustomHistogram is a histogram for a set of custom integers.  It derives
      // directly from Histogram and is created from a caller-supplied vector of
      // range limits rather than from a minimum/maximum/bucket count triple.
649 class BASE_EXPORT CustomHistogram : public Histogram {
650  public:
651   // |custom_ranges| contains a vector of limits on ranges. Each limit should be
652   // > 0 and < kSampleType_MAX. (Currently 0 is still accepted for backward
653   // compatibility). The limits can be unordered or contain duplication, but
654   // client should not depend on this.
655   static HistogramBase* FactoryGet(const std::string& name,
656                                    const std::vector<Sample>& custom_ranges,
657                                    int32 flags);
658 
659   // Overridden from Histogram:
660   virtual HistogramType GetHistogramType() const OVERRIDE;
661 
662   // Helper method for transforming an array of valid enumeration values
663   // to the std::vector<int> expected by HISTOGRAM_CUSTOM_ENUMERATION.
664   // This function ensures that a guard bucket exists right after any
665   // valid sample value (unless the next higher sample is also a valid value),
666   // so that invalid samples never fall into the same bucket as valid samples.
      // |values| points to the first of |num_values| valid sample values.
667   // TODO(kaiwang): Change name to ArrayToCustomEnumRanges.
668   static std::vector<Sample> ArrayToCustomRanges(const Sample* values,
669                                                  size_t num_values);
670  protected:
      // Takes only a name and the bucket ranges; no separate minimum/maximum.
671   CustomHistogram(const std::string& name,
672                   const BucketRanges* ranges);
673 
674   // HistogramBase implementation:
675   virtual bool SerializeInfoImpl(Pickle* pickle) const OVERRIDE;
676 
      // Overridden from Histogram:
677   virtual double GetBucketSize(Count current, size_t i) const OVERRIDE;
678 
679  private:
680   friend BASE_EXPORT_PRIVATE HistogramBase* DeserializeHistogramInfo(
681       PickleIterator* iter);
682   static HistogramBase* DeserializeInfoImpl(PickleIterator* iter);
683 
      // Private helpers operating on the |custom_ranges| vector.
      // NOTE(review): presumably used by FactoryGet() to check the limits and
      // build the BucketRanges -- confirm against the .cc file.
684   static bool ValidateCustomRanges(const std::vector<Sample>& custom_ranges);
685   static BucketRanges* CreateBucketRangesFromCustomRanges(
686       const std::vector<Sample>& custom_ranges);
687 
688   DISALLOW_COPY_AND_ASSIGN(CustomHistogram);
689 };
690 
691 }  // namespace base
692 
693 #endif  // BASE_METRICS_HISTOGRAM_H_
694