1 /*
2 * Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
11 #include "webrtc/video_engine/overuse_frame_detector.h"
12
13 #include <assert.h>
14 #include <math.h>
15
16 #include <algorithm>
17 #include <list>
18 #include <map>
19
20 #include "webrtc/base/exp_filter.h"
21 #include "webrtc/system_wrappers/interface/clock.h"
22 #include "webrtc/system_wrappers/interface/critical_section_wrapper.h"
23 #include "webrtc/system_wrappers/interface/logging.h"
24
25 namespace webrtc {
26
27 // TODO(mflodman) Test different values for all of these to trigger correctly,
28 // avoid fluctuations etc.
29 namespace {
30 const int64_t kProcessIntervalMs = 5000;
31
32 // Weight factor to apply to the standard deviation.
33 const float kWeightFactor = 0.997f;
34 // Weight factor to apply to the average.
35 const float kWeightFactorMean = 0.98f;
36
37 // Delay between consecutive rampups. (Used for quick recovery.)
38 const int kQuickRampUpDelayMs = 10 * 1000;
39 // Delay between rampup attempts. Initially uses standard, scales up to max.
40 const int kStandardRampUpDelayMs = 40 * 1000;
41 const int kMaxRampUpDelayMs = 240 * 1000;
42 // Expontential back-off factor, to prevent annoying up-down behaviour.
43 const double kRampUpBackoffFactor = 2.0;
44
45 // Max number of overuses detected before always applying the rampup delay.
46 const int kMaxOverusesBeforeApplyRampupDelay = 4;
47
48 // The maximum exponent to use in VCMExpFilter.
49 const float kSampleDiffMs = 33.0f;
50 const float kMaxExp = 7.0f;
51
52 } // namespace
53
Statistics()54 Statistics::Statistics() :
55 sum_(0.0),
56 count_(0),
57 filtered_samples_(new rtc::ExpFilter(kWeightFactorMean)),
58 filtered_variance_(new rtc::ExpFilter(kWeightFactor)) {
59 Reset();
60 }
61
SetOptions(const CpuOveruseOptions & options)62 void Statistics::SetOptions(const CpuOveruseOptions& options) {
63 options_ = options;
64 }
65
Reset()66 void Statistics::Reset() {
67 sum_ = 0.0;
68 count_ = 0;
69 filtered_variance_->Reset(kWeightFactor);
70 filtered_variance_->Apply(1.0f, InitialVariance());
71 }
72
AddSample(float sample_ms)73 void Statistics::AddSample(float sample_ms) {
74 sum_ += sample_ms;
75 ++count_;
76
77 if (count_ < static_cast<uint32_t>(options_.min_frame_samples)) {
78 // Initialize filtered samples.
79 filtered_samples_->Reset(kWeightFactorMean);
80 filtered_samples_->Apply(1.0f, InitialMean());
81 return;
82 }
83
84 float exp = sample_ms / kSampleDiffMs;
85 exp = std::min(exp, kMaxExp);
86 filtered_samples_->Apply(exp, sample_ms);
87 filtered_variance_->Apply(exp, (sample_ms - filtered_samples_->filtered()) *
88 (sample_ms - filtered_samples_->filtered()));
89 }
90
InitialMean() const91 float Statistics::InitialMean() const {
92 if (count_ == 0)
93 return 0.0;
94 return sum_ / count_;
95 }
96
InitialVariance() const97 float Statistics::InitialVariance() const {
98 // Start in between the underuse and overuse threshold.
99 float average_stddev = (options_.low_capture_jitter_threshold_ms +
100 options_.high_capture_jitter_threshold_ms) / 2.0f;
101 return average_stddev * average_stddev;
102 }
103
Mean() const104 float Statistics::Mean() const { return filtered_samples_->filtered(); }
105
StdDev() const106 float Statistics::StdDev() const {
107 return sqrt(std::max(filtered_variance_->filtered(), 0.0f));
108 }
109
Count() const110 uint64_t Statistics::Count() const { return count_; }
111
112
113 // Class for calculating the average encode time.
114 class OveruseFrameDetector::EncodeTimeAvg {
115 public:
EncodeTimeAvg()116 EncodeTimeAvg()
117 : kWeightFactor(0.5f),
118 kInitialAvgEncodeTimeMs(5.0f),
119 filtered_encode_time_ms_(new rtc::ExpFilter(kWeightFactor)) {
120 filtered_encode_time_ms_->Apply(1.0f, kInitialAvgEncodeTimeMs);
121 }
~EncodeTimeAvg()122 ~EncodeTimeAvg() {}
123
AddEncodeSample(float encode_time_ms,int64_t diff_last_sample_ms)124 void AddEncodeSample(float encode_time_ms, int64_t diff_last_sample_ms) {
125 float exp = diff_last_sample_ms / kSampleDiffMs;
126 exp = std::min(exp, kMaxExp);
127 filtered_encode_time_ms_->Apply(exp, encode_time_ms);
128 }
129
Value() const130 int Value() const {
131 return static_cast<int>(filtered_encode_time_ms_->filtered() + 0.5);
132 }
133
134 private:
135 const float kWeightFactor;
136 const float kInitialAvgEncodeTimeMs;
137 scoped_ptr<rtc::ExpFilter> filtered_encode_time_ms_;
138 };
139
140 // Class for calculating the encode usage.
141 class OveruseFrameDetector::EncodeUsage {
142 public:
EncodeUsage()143 EncodeUsage()
144 : kWeightFactorFrameDiff(0.998f),
145 kWeightFactorEncodeTime(0.995f),
146 kInitialSampleDiffMs(40.0f),
147 kMaxSampleDiffMs(45.0f),
148 count_(0),
149 filtered_encode_time_ms_(new rtc::ExpFilter(kWeightFactorEncodeTime)),
150 filtered_frame_diff_ms_(new rtc::ExpFilter(kWeightFactorFrameDiff)) {
151 Reset();
152 }
~EncodeUsage()153 ~EncodeUsage() {}
154
SetOptions(const CpuOveruseOptions & options)155 void SetOptions(const CpuOveruseOptions& options) {
156 options_ = options;
157 }
158
Reset()159 void Reset() {
160 count_ = 0;
161 filtered_frame_diff_ms_->Reset(kWeightFactorFrameDiff);
162 filtered_frame_diff_ms_->Apply(1.0f, kInitialSampleDiffMs);
163 filtered_encode_time_ms_->Reset(kWeightFactorEncodeTime);
164 filtered_encode_time_ms_->Apply(1.0f, InitialEncodeTimeMs());
165 }
166
AddSample(float sample_ms)167 void AddSample(float sample_ms) {
168 float exp = sample_ms / kSampleDiffMs;
169 exp = std::min(exp, kMaxExp);
170 filtered_frame_diff_ms_->Apply(exp, sample_ms);
171 }
172
AddEncodeSample(float encode_time_ms,int64_t diff_last_sample_ms)173 void AddEncodeSample(float encode_time_ms, int64_t diff_last_sample_ms) {
174 ++count_;
175 float exp = diff_last_sample_ms / kSampleDiffMs;
176 exp = std::min(exp, kMaxExp);
177 filtered_encode_time_ms_->Apply(exp, encode_time_ms);
178 }
179
Value() const180 int Value() const {
181 if (count_ < static_cast<uint32_t>(options_.min_frame_samples)) {
182 return static_cast<int>(InitialUsageInPercent() + 0.5f);
183 }
184 float frame_diff_ms = std::max(filtered_frame_diff_ms_->filtered(), 1.0f);
185 frame_diff_ms = std::min(frame_diff_ms, kMaxSampleDiffMs);
186 float encode_usage_percent =
187 100.0f * filtered_encode_time_ms_->filtered() / frame_diff_ms;
188 return static_cast<int>(encode_usage_percent + 0.5);
189 }
190
191 private:
InitialUsageInPercent() const192 float InitialUsageInPercent() const {
193 // Start in between the underuse and overuse threshold.
194 return (options_.low_encode_usage_threshold_percent +
195 options_.high_encode_usage_threshold_percent) / 2.0f;
196 }
197
InitialEncodeTimeMs() const198 float InitialEncodeTimeMs() const {
199 return InitialUsageInPercent() * kInitialSampleDiffMs / 100;
200 }
201
202 const float kWeightFactorFrameDiff;
203 const float kWeightFactorEncodeTime;
204 const float kInitialSampleDiffMs;
205 const float kMaxSampleDiffMs;
206 uint64_t count_;
207 CpuOveruseOptions options_;
208 scoped_ptr<rtc::ExpFilter> filtered_encode_time_ms_;
209 scoped_ptr<rtc::ExpFilter> filtered_frame_diff_ms_;
210 };
211
212 // Class for calculating the relative standard deviation of encode times.
213 class OveruseFrameDetector::EncodeTimeRsd {
214 public:
EncodeTimeRsd(Clock * clock)215 EncodeTimeRsd(Clock* clock)
216 : kWeightFactor(0.6f),
217 count_(0),
218 filtered_rsd_(new rtc::ExpFilter(kWeightFactor)),
219 hist_samples_(0),
220 hist_sum_(0.0f),
221 last_process_time_ms_(clock->TimeInMilliseconds()) {
222 Reset();
223 }
~EncodeTimeRsd()224 ~EncodeTimeRsd() {}
225
SetOptions(const CpuOveruseOptions & options)226 void SetOptions(const CpuOveruseOptions& options) {
227 options_ = options;
228 }
229
Reset()230 void Reset() {
231 count_ = 0;
232 filtered_rsd_->Reset(kWeightFactor);
233 filtered_rsd_->Apply(1.0f, InitialValue());
234 hist_.clear();
235 hist_samples_ = 0;
236 hist_sum_ = 0.0f;
237 }
238
AddEncodeSample(float encode_time_ms)239 void AddEncodeSample(float encode_time_ms) {
240 int bin = static_cast<int>(encode_time_ms + 0.5f);
241 if (bin <= 0) {
242 // The frame was probably not encoded, skip possible dropped frame.
243 return;
244 }
245 ++count_;
246 ++hist_[bin];
247 ++hist_samples_;
248 hist_sum_ += bin;
249 }
250
Process(int64_t now)251 void Process(int64_t now) {
252 if (count_ < static_cast<uint32_t>(options_.min_frame_samples)) {
253 // Have not received min number of frames since last reset.
254 return;
255 }
256 const int kMinHistSamples = 20;
257 if (hist_samples_ < kMinHistSamples) {
258 return;
259 }
260 const int64_t kMinDiffSinceLastProcessMs = 1000;
261 int64_t diff_last_process_ms = now - last_process_time_ms_;
262 if (now - last_process_time_ms_ <= kMinDiffSinceLastProcessMs) {
263 return;
264 }
265 last_process_time_ms_ = now;
266
267 // Calculate variance (using samples above the mean).
268 // Checks for a larger encode time of some frames while there is a small
269 // increase in the average time.
270 int mean = hist_sum_ / hist_samples_;
271 float variance = 0.0f;
272 int total_count = 0;
273 for (std::map<int,int>::iterator it = hist_.begin();
274 it != hist_.end(); ++it) {
275 int time = it->first;
276 int count = it->second;
277 if (time > mean) {
278 total_count += count;
279 for (int i = 0; i < count; ++i) {
280 variance += ((time - mean) * (time - mean));
281 }
282 }
283 }
284 variance /= std::max(total_count, 1);
285 float cov = sqrt(variance) / mean;
286
287 hist_.clear();
288 hist_samples_ = 0;
289 hist_sum_ = 0.0f;
290
291 float exp = static_cast<float>(diff_last_process_ms) / kProcessIntervalMs;
292 exp = std::min(exp, kMaxExp);
293 filtered_rsd_->Apply(exp, 100.0f * cov);
294 }
295
Value() const296 int Value() const {
297 return static_cast<int>(filtered_rsd_->filtered() + 0.5);
298 }
299
300 private:
InitialValue() const301 float InitialValue() const {
302 // Start in between the underuse and overuse threshold.
303 return std::max(((options_.low_encode_time_rsd_threshold +
304 options_.high_encode_time_rsd_threshold) / 2.0f), 0.0f);
305 }
306
307 const float kWeightFactor;
308 uint32_t count_; // Number of encode samples since last reset.
309 CpuOveruseOptions options_;
310 scoped_ptr<rtc::ExpFilter> filtered_rsd_;
311 int hist_samples_;
312 float hist_sum_;
313 std::map<int,int> hist_; // Histogram of encode time of frames.
314 int64_t last_process_time_ms_;
315 };
316
317 // Class for calculating the capture queue delay change.
318 class OveruseFrameDetector::CaptureQueueDelay {
319 public:
CaptureQueueDelay()320 CaptureQueueDelay()
321 : kWeightFactor(0.5f),
322 delay_ms_(0),
323 filtered_delay_ms_per_s_(new rtc::ExpFilter(kWeightFactor)) {
324 filtered_delay_ms_per_s_->Apply(1.0f, 0.0f);
325 }
~CaptureQueueDelay()326 ~CaptureQueueDelay() {}
327
FrameCaptured(int64_t now)328 void FrameCaptured(int64_t now) {
329 const size_t kMaxSize = 200;
330 if (frames_.size() > kMaxSize) {
331 frames_.pop_front();
332 }
333 frames_.push_back(now);
334 }
335
FrameProcessingStarted(int64_t now)336 void FrameProcessingStarted(int64_t now) {
337 if (frames_.empty()) {
338 return;
339 }
340 delay_ms_ = now - frames_.front();
341 frames_.pop_front();
342 }
343
CalculateDelayChange(int64_t diff_last_sample_ms)344 void CalculateDelayChange(int64_t diff_last_sample_ms) {
345 if (diff_last_sample_ms <= 0) {
346 return;
347 }
348 float exp = static_cast<float>(diff_last_sample_ms) / kProcessIntervalMs;
349 exp = std::min(exp, kMaxExp);
350 filtered_delay_ms_per_s_->Apply(exp,
351 delay_ms_ * 1000.0f / diff_last_sample_ms);
352 ClearFrames();
353 }
354
ClearFrames()355 void ClearFrames() {
356 frames_.clear();
357 }
358
delay_ms() const359 int delay_ms() const {
360 return delay_ms_;
361 }
362
Value() const363 int Value() const {
364 return static_cast<int>(filtered_delay_ms_per_s_->filtered() + 0.5);
365 }
366
367 private:
368 const float kWeightFactor;
369 std::list<int64_t> frames_;
370 int delay_ms_;
371 scoped_ptr<rtc::ExpFilter> filtered_delay_ms_per_s_;
372 };
373
OveruseFrameDetector(Clock * clock)374 OveruseFrameDetector::OveruseFrameDetector(Clock* clock)
375 : crit_(CriticalSectionWrapper::CreateCriticalSection()),
376 observer_(NULL),
377 clock_(clock),
378 next_process_time_(clock_->TimeInMilliseconds()),
379 num_process_times_(0),
380 last_capture_time_(0),
381 last_overuse_time_(0),
382 checks_above_threshold_(0),
383 num_overuse_detections_(0),
384 last_rampup_time_(0),
385 in_quick_rampup_(false),
386 current_rampup_delay_ms_(kStandardRampUpDelayMs),
387 num_pixels_(0),
388 last_encode_sample_ms_(0),
389 encode_time_(new EncodeTimeAvg()),
390 encode_rsd_(new EncodeTimeRsd(clock)),
391 encode_usage_(new EncodeUsage()),
392 capture_queue_delay_(new CaptureQueueDelay()) {
393 }
394
~OveruseFrameDetector()395 OveruseFrameDetector::~OveruseFrameDetector() {
396 }
397
SetObserver(CpuOveruseObserver * observer)398 void OveruseFrameDetector::SetObserver(CpuOveruseObserver* observer) {
399 CriticalSectionScoped cs(crit_.get());
400 observer_ = observer;
401 }
402
SetOptions(const CpuOveruseOptions & options)403 void OveruseFrameDetector::SetOptions(const CpuOveruseOptions& options) {
404 assert(options.min_frame_samples > 0);
405 CriticalSectionScoped cs(crit_.get());
406 if (options_.Equals(options)) {
407 return;
408 }
409 options_ = options;
410 capture_deltas_.SetOptions(options);
411 encode_usage_->SetOptions(options);
412 encode_rsd_->SetOptions(options);
413 ResetAll(num_pixels_);
414 }
415
CaptureQueueDelayMsPerS() const416 int OveruseFrameDetector::CaptureQueueDelayMsPerS() const {
417 CriticalSectionScoped cs(crit_.get());
418 return capture_queue_delay_->delay_ms();
419 }
420
GetCpuOveruseMetrics(CpuOveruseMetrics * metrics) const421 void OveruseFrameDetector::GetCpuOveruseMetrics(
422 CpuOveruseMetrics* metrics) const {
423 CriticalSectionScoped cs(crit_.get());
424 metrics->capture_jitter_ms = static_cast<int>(capture_deltas_.StdDev() + 0.5);
425 metrics->avg_encode_time_ms = encode_time_->Value();
426 metrics->encode_rsd = encode_rsd_->Value();
427 metrics->encode_usage_percent = encode_usage_->Value();
428 metrics->capture_queue_delay_ms_per_s = capture_queue_delay_->Value();
429 }
430
TimeUntilNextProcess()431 int32_t OveruseFrameDetector::TimeUntilNextProcess() {
432 CriticalSectionScoped cs(crit_.get());
433 return next_process_time_ - clock_->TimeInMilliseconds();
434 }
435
FrameSizeChanged(int num_pixels) const436 bool OveruseFrameDetector::FrameSizeChanged(int num_pixels) const {
437 if (num_pixels != num_pixels_) {
438 return true;
439 }
440 return false;
441 }
442
FrameTimeoutDetected(int64_t now) const443 bool OveruseFrameDetector::FrameTimeoutDetected(int64_t now) const {
444 if (last_capture_time_ == 0) {
445 return false;
446 }
447 return (now - last_capture_time_) > options_.frame_timeout_interval_ms;
448 }
449
ResetAll(int num_pixels)450 void OveruseFrameDetector::ResetAll(int num_pixels) {
451 num_pixels_ = num_pixels;
452 capture_deltas_.Reset();
453 encode_usage_->Reset();
454 encode_rsd_->Reset();
455 capture_queue_delay_->ClearFrames();
456 last_capture_time_ = 0;
457 num_process_times_ = 0;
458 }
459
FrameCaptured(int width,int height)460 void OveruseFrameDetector::FrameCaptured(int width, int height) {
461 CriticalSectionScoped cs(crit_.get());
462
463 int64_t now = clock_->TimeInMilliseconds();
464 if (FrameSizeChanged(width * height) || FrameTimeoutDetected(now)) {
465 ResetAll(width * height);
466 }
467
468 if (last_capture_time_ != 0) {
469 capture_deltas_.AddSample(now - last_capture_time_);
470 encode_usage_->AddSample(now - last_capture_time_);
471 }
472 last_capture_time_ = now;
473
474 capture_queue_delay_->FrameCaptured(now);
475 }
476
FrameProcessingStarted()477 void OveruseFrameDetector::FrameProcessingStarted() {
478 CriticalSectionScoped cs(crit_.get());
479 capture_queue_delay_->FrameProcessingStarted(clock_->TimeInMilliseconds());
480 }
481
FrameEncoded(int encode_time_ms)482 void OveruseFrameDetector::FrameEncoded(int encode_time_ms) {
483 CriticalSectionScoped cs(crit_.get());
484 int64_t time = clock_->TimeInMilliseconds();
485 if (last_encode_sample_ms_ != 0) {
486 int64_t diff_ms = time - last_encode_sample_ms_;
487 encode_time_->AddEncodeSample(encode_time_ms, diff_ms);
488 encode_usage_->AddEncodeSample(encode_time_ms, diff_ms);
489 encode_rsd_->AddEncodeSample(encode_time_ms);
490 }
491 last_encode_sample_ms_ = time;
492 }
493
Process()494 int32_t OveruseFrameDetector::Process() {
495 CriticalSectionScoped cs(crit_.get());
496
497 int64_t now = clock_->TimeInMilliseconds();
498
499 // Used to protect against Process() being called too often.
500 if (now < next_process_time_)
501 return 0;
502
503 int64_t diff_ms = now - next_process_time_ + kProcessIntervalMs;
504 next_process_time_ = now + kProcessIntervalMs;
505 ++num_process_times_;
506
507 encode_rsd_->Process(now);
508 capture_queue_delay_->CalculateDelayChange(diff_ms);
509
510 if (num_process_times_ <= options_.min_process_count) {
511 return 0;
512 }
513
514 if (IsOverusing()) {
515 // If the last thing we did was going up, and now have to back down, we need
516 // to check if this peak was short. If so we should back off to avoid going
517 // back and forth between this load, the system doesn't seem to handle it.
518 bool check_for_backoff = last_rampup_time_ > last_overuse_time_;
519 if (check_for_backoff) {
520 if (now - last_rampup_time_ < kStandardRampUpDelayMs ||
521 num_overuse_detections_ > kMaxOverusesBeforeApplyRampupDelay) {
522 // Going up was not ok for very long, back off.
523 current_rampup_delay_ms_ *= kRampUpBackoffFactor;
524 if (current_rampup_delay_ms_ > kMaxRampUpDelayMs)
525 current_rampup_delay_ms_ = kMaxRampUpDelayMs;
526 } else {
527 // Not currently backing off, reset rampup delay.
528 current_rampup_delay_ms_ = kStandardRampUpDelayMs;
529 }
530 }
531
532 last_overuse_time_ = now;
533 in_quick_rampup_ = false;
534 checks_above_threshold_ = 0;
535 ++num_overuse_detections_;
536
537 if (observer_ != NULL)
538 observer_->OveruseDetected();
539 } else if (IsUnderusing(now)) {
540 last_rampup_time_ = now;
541 in_quick_rampup_ = true;
542
543 if (observer_ != NULL)
544 observer_->NormalUsage();
545 }
546
547 int rampup_delay =
548 in_quick_rampup_ ? kQuickRampUpDelayMs : current_rampup_delay_ms_;
549 LOG(LS_VERBOSE) << " Frame stats: capture avg: " << capture_deltas_.Mean()
550 << " capture stddev " << capture_deltas_.StdDev()
551 << " encode usage " << encode_usage_->Value()
552 << " encode rsd " << encode_rsd_->Value()
553 << " overuse detections " << num_overuse_detections_
554 << " rampup delay " << rampup_delay;
555 return 0;
556 }
557
IsOverusing()558 bool OveruseFrameDetector::IsOverusing() {
559 bool overusing = false;
560 if (options_.enable_capture_jitter_method) {
561 overusing = capture_deltas_.StdDev() >=
562 options_.high_capture_jitter_threshold_ms;
563 } else if (options_.enable_encode_usage_method) {
564 bool encode_usage_overuse =
565 encode_usage_->Value() >= options_.high_encode_usage_threshold_percent;
566 bool encode_rsd_overuse = false;
567 if (options_.high_encode_time_rsd_threshold > 0) {
568 encode_rsd_overuse =
569 (encode_rsd_->Value() >= options_.high_encode_time_rsd_threshold);
570 }
571 overusing = encode_usage_overuse || encode_rsd_overuse;
572 }
573
574 if (overusing) {
575 ++checks_above_threshold_;
576 } else {
577 checks_above_threshold_ = 0;
578 }
579 return checks_above_threshold_ >= options_.high_threshold_consecutive_count;
580 }
581
IsUnderusing(int64_t time_now)582 bool OveruseFrameDetector::IsUnderusing(int64_t time_now) {
583 int delay = in_quick_rampup_ ? kQuickRampUpDelayMs : current_rampup_delay_ms_;
584 if (time_now < last_rampup_time_ + delay)
585 return false;
586
587 bool underusing = false;
588 if (options_.enable_capture_jitter_method) {
589 underusing = capture_deltas_.StdDev() <
590 options_.low_capture_jitter_threshold_ms;
591 } else if (options_.enable_encode_usage_method) {
592 bool encode_usage_underuse =
593 encode_usage_->Value() < options_.low_encode_usage_threshold_percent;
594 bool encode_rsd_underuse = true;
595 if (options_.low_encode_time_rsd_threshold > 0) {
596 encode_rsd_underuse =
597 (encode_rsd_->Value() < options_.low_encode_time_rsd_threshold);
598 }
599 underusing = encode_usage_underuse && encode_rsd_underuse;
600 }
601 return underusing;
602 }
603 } // namespace webrtc
604