Home | History | Annotate | Download | only in video_engine
      1 /*
      2  *  Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
      3  *
      4  *  Use of this source code is governed by a BSD-style license
      5  *  that can be found in the LICENSE file in the root of the source
      6  *  tree. An additional intellectual property rights grant can be found
      7  *  in the file PATENTS.  All contributing project authors may
      8  *  be found in the AUTHORS file in the root of the source tree.
      9  */
     10 
     11 #include "webrtc/video_engine/overuse_frame_detector.h"
     12 
     13 #include <assert.h>
     14 #include <math.h>
     15 
     16 #include <algorithm>
     17 #include <list>
     18 #include <map>
     19 
     20 #include "webrtc/modules/video_coding/utility/include/exp_filter.h"
     21 #include "webrtc/system_wrappers/interface/clock.h"
     22 #include "webrtc/system_wrappers/interface/critical_section_wrapper.h"
     23 #include "webrtc/system_wrappers/interface/logging.h"
     24 
     25 namespace webrtc {
     26 
     27 // TODO(mflodman) Test different values for all of these to trigger correctly,
     28 // avoid fluctuations etc.
     29 namespace {
     30 const int64_t kProcessIntervalMs = 5000;
     31 
     32 // Weight factor to apply to the standard deviation.
     33 const float kWeightFactor = 0.997f;
     34 // Weight factor to apply to the average.
     35 const float kWeightFactorMean = 0.98f;
     36 
     37 // Delay between consecutive rampups. (Used for quick recovery.)
     38 const int kQuickRampUpDelayMs = 10 * 1000;
     39 // Delay between rampup attempts. Initially uses standard, scales up to max.
     40 const int kStandardRampUpDelayMs = 30 * 1000;
     41 const int kMaxRampUpDelayMs = 240 * 1000;
     42 // Expontential back-off factor, to prevent annoying up-down behaviour.
     43 const double kRampUpBackoffFactor = 2.0;
     44 
     45 // Max number of overuses detected before always applying the rampup delay.
     46 const int kMaxOverusesBeforeApplyRampupDelay = 7;
     47 
     48 // The maximum exponent to use in VCMExpFilter.
     49 const float kSampleDiffMs = 33.0f;
     50 const float kMaxExp = 7.0f;
     51 
     52 }  // namespace
     53 
     54 Statistics::Statistics() :
     55     sum_(0.0),
     56     count_(0),
     57     filtered_samples_(new VCMExpFilter(kWeightFactorMean)),
     58     filtered_variance_(new VCMExpFilter(kWeightFactor)) {
     59   Reset();
     60 }
     61 
     62 void Statistics::SetOptions(const CpuOveruseOptions& options) {
     63   options_ = options;
     64 }
     65 
     66 void Statistics::Reset() {
     67   sum_ =  0.0;
     68   count_ = 0;
     69   filtered_variance_->Reset(kWeightFactor);
     70   filtered_variance_->Apply(1.0f, InitialVariance());
     71 }
     72 
     73 void Statistics::AddSample(float sample_ms) {
     74   sum_ += sample_ms;
     75   ++count_;
     76 
     77   if (count_ < static_cast<uint32_t>(options_.min_frame_samples)) {
     78     // Initialize filtered samples.
     79     filtered_samples_->Reset(kWeightFactorMean);
     80     filtered_samples_->Apply(1.0f, InitialMean());
     81     return;
     82   }
     83 
     84   float exp = sample_ms / kSampleDiffMs;
     85   exp = std::min(exp, kMaxExp);
     86   filtered_samples_->Apply(exp, sample_ms);
     87   filtered_variance_->Apply(exp, (sample_ms - filtered_samples_->Value()) *
     88                                  (sample_ms - filtered_samples_->Value()));
     89 }
     90 
     91 float Statistics::InitialMean() const {
     92   if (count_ == 0)
     93     return 0.0;
     94   return sum_ / count_;
     95 }
     96 
     97 float Statistics::InitialVariance() const {
     98   // Start in between the underuse and overuse threshold.
     99   float average_stddev = (options_.low_capture_jitter_threshold_ms +
    100                           options_.high_capture_jitter_threshold_ms) / 2.0f;
    101   return average_stddev * average_stddev;
    102 }
    103 
    104 float Statistics::Mean() const { return filtered_samples_->Value(); }
    105 
    106 float Statistics::StdDev() const {
    107   return sqrt(std::max(filtered_variance_->Value(), 0.0f));
    108 }
    109 
    110 uint64_t Statistics::Count() const { return count_; }
    111 
    112 
    113 // Class for calculating the average encode time.
    114 class OveruseFrameDetector::EncodeTimeAvg {
    115  public:
    116   EncodeTimeAvg()
    117       : kWeightFactor(0.5f),
    118         kInitialAvgEncodeTimeMs(5.0f),
    119         filtered_encode_time_ms_(new VCMExpFilter(kWeightFactor)) {
    120     filtered_encode_time_ms_->Apply(1.0f, kInitialAvgEncodeTimeMs);
    121   }
    122   ~EncodeTimeAvg() {}
    123 
    124   void AddEncodeSample(float encode_time_ms, int64_t diff_last_sample_ms) {
    125     float exp =  diff_last_sample_ms / kSampleDiffMs;
    126     exp = std::min(exp, kMaxExp);
    127     filtered_encode_time_ms_->Apply(exp, encode_time_ms);
    128   }
    129 
    130   int Value() const {
    131     return static_cast<int>(filtered_encode_time_ms_->Value() + 0.5);
    132   }
    133 
    134  private:
    135   const float kWeightFactor;
    136   const float kInitialAvgEncodeTimeMs;
    137   scoped_ptr<VCMExpFilter> filtered_encode_time_ms_;
    138 };
    139 
    140 // Class for calculating the encode usage.
    141 class OveruseFrameDetector::EncodeUsage {
    142  public:
    143   EncodeUsage()
    144       : kWeightFactorFrameDiff(0.998f),
    145         kWeightFactorEncodeTime(0.995f),
    146         kInitialSampleDiffMs(40.0f),
    147         kMaxSampleDiffMs(45.0f),
    148         count_(0),
    149         filtered_encode_time_ms_(new VCMExpFilter(kWeightFactorEncodeTime)),
    150         filtered_frame_diff_ms_(new VCMExpFilter(kWeightFactorFrameDiff)) {
    151     Reset();
    152   }
    153   ~EncodeUsage() {}
    154 
    155   void SetOptions(const CpuOveruseOptions& options) {
    156     options_ = options;
    157   }
    158 
    159   void Reset() {
    160     count_ = 0;
    161     filtered_frame_diff_ms_->Reset(kWeightFactorFrameDiff);
    162     filtered_frame_diff_ms_->Apply(1.0f, kInitialSampleDiffMs);
    163     filtered_encode_time_ms_->Reset(kWeightFactorEncodeTime);
    164     filtered_encode_time_ms_->Apply(1.0f, InitialEncodeTimeMs());
    165   }
    166 
    167   void AddSample(float sample_ms) {
    168     float exp = sample_ms / kSampleDiffMs;
    169     exp = std::min(exp, kMaxExp);
    170     filtered_frame_diff_ms_->Apply(exp, sample_ms);
    171   }
    172 
    173   void AddEncodeSample(float encode_time_ms, int64_t diff_last_sample_ms) {
    174     ++count_;
    175     float exp = diff_last_sample_ms / kSampleDiffMs;
    176     exp = std::min(exp, kMaxExp);
    177     filtered_encode_time_ms_->Apply(exp, encode_time_ms);
    178   }
    179 
    180   int Value() const {
    181     if (count_ < static_cast<uint32_t>(options_.min_frame_samples)) {
    182       return static_cast<int>(InitialUsageInPercent() + 0.5f);
    183     }
    184     float frame_diff_ms = std::max(filtered_frame_diff_ms_->Value(), 1.0f);
    185     frame_diff_ms = std::min(frame_diff_ms, kMaxSampleDiffMs);
    186     float encode_usage_percent =
    187         100.0f * filtered_encode_time_ms_->Value() / frame_diff_ms;
    188     return static_cast<int>(encode_usage_percent + 0.5);
    189   }
    190 
    191  private:
    192   float InitialUsageInPercent() const {
    193     // Start in between the underuse and overuse threshold.
    194     return (options_.low_encode_usage_threshold_percent +
    195             options_.high_encode_usage_threshold_percent) / 2.0f;
    196   }
    197 
    198   float InitialEncodeTimeMs() const {
    199     return InitialUsageInPercent() * kInitialSampleDiffMs / 100;
    200   }
    201 
    202   const float kWeightFactorFrameDiff;
    203   const float kWeightFactorEncodeTime;
    204   const float kInitialSampleDiffMs;
    205   const float kMaxSampleDiffMs;
    206   uint64_t count_;
    207   CpuOveruseOptions options_;
    208   scoped_ptr<VCMExpFilter> filtered_encode_time_ms_;
    209   scoped_ptr<VCMExpFilter> filtered_frame_diff_ms_;
    210 };
    211 
    212 // Class for calculating the relative standard deviation of encode times.
    213 class OveruseFrameDetector::EncodeTimeRsd {
    214  public:
    215   EncodeTimeRsd(Clock* clock)
    216       : kWeightFactor(0.6f),
    217         count_(0),
    218         filtered_rsd_(new VCMExpFilter(kWeightFactor)),
    219         hist_samples_(0),
    220         hist_sum_(0.0f),
    221         last_process_time_ms_(clock->TimeInMilliseconds()) {
    222     Reset();
    223   }
    224   ~EncodeTimeRsd() {}
    225 
    226   void SetOptions(const CpuOveruseOptions& options) {
    227     options_ = options;
    228   }
    229 
    230   void Reset() {
    231     count_ = 0;
    232     filtered_rsd_->Reset(kWeightFactor);
    233     filtered_rsd_->Apply(1.0f, InitialValue());
    234     hist_.clear();
    235     hist_samples_ = 0;
    236     hist_sum_ = 0.0f;
    237   }
    238 
    239   void AddEncodeSample(float encode_time_ms) {
    240     int bin = static_cast<int>(encode_time_ms + 0.5f);
    241     if (bin <= 0) {
    242       // The frame was probably not encoded, skip possible dropped frame.
    243       return;
    244     }
    245     ++count_;
    246     ++hist_[bin];
    247     ++hist_samples_;
    248     hist_sum_ += bin;
    249   }
    250 
    251   void Process(int64_t now) {
    252     if (count_ < static_cast<uint32_t>(options_.min_frame_samples)) {
    253       // Have not received min number of frames since last reset.
    254       return;
    255     }
    256     const int kMinHistSamples = 20;
    257     if (hist_samples_ < kMinHistSamples) {
    258       return;
    259     }
    260     const int64_t kMinDiffSinceLastProcessMs = 1000;
    261     int64_t diff_last_process_ms = now - last_process_time_ms_;
    262     if (now - last_process_time_ms_ <= kMinDiffSinceLastProcessMs) {
    263       return;
    264     }
    265     last_process_time_ms_ = now;
    266 
    267     // Calculate variance (using samples above the mean).
    268     // Checks for a larger encode time of some frames while there is a small
    269     // increase in the average time.
    270     int mean = hist_sum_ / hist_samples_;
    271     float variance = 0.0f;
    272     int total_count = 0;
    273     for (std::map<int,int>::iterator it = hist_.begin();
    274          it != hist_.end(); ++it) {
    275       int time = it->first;
    276       int count = it->second;
    277       if (time > mean) {
    278         total_count += count;
    279         for (int i = 0; i < count; ++i) {
    280           variance += ((time - mean) * (time - mean));
    281         }
    282       }
    283     }
    284     variance /= std::max(total_count, 1);
    285     float cov = sqrt(variance) / mean;
    286 
    287     hist_.clear();
    288     hist_samples_ = 0;
    289     hist_sum_ = 0.0f;
    290 
    291     float exp = static_cast<float>(diff_last_process_ms) / kProcessIntervalMs;
    292     exp = std::min(exp, kMaxExp);
    293     filtered_rsd_->Apply(exp, 100.0f * cov);
    294   }
    295 
    296   int Value() const {
    297     return static_cast<int>(filtered_rsd_->Value() + 0.5);
    298   }
    299 
    300  private:
    301   float InitialValue() const {
    302     // Start in between the underuse and overuse threshold.
    303     return std::max(((options_.low_encode_time_rsd_threshold +
    304                       options_.high_encode_time_rsd_threshold) / 2.0f), 0.0f);
    305   }
    306 
    307   const float kWeightFactor;
    308   uint32_t count_;  // Number of encode samples since last reset.
    309   CpuOveruseOptions options_;
    310   scoped_ptr<VCMExpFilter> filtered_rsd_;
    311   int hist_samples_;
    312   float hist_sum_;
    313   std::map<int,int> hist_;  // Histogram of encode time of frames.
    314   int64_t last_process_time_ms_;
    315 };
    316 
    317 // Class for calculating the capture queue delay change.
    318 class OveruseFrameDetector::CaptureQueueDelay {
    319  public:
    320   CaptureQueueDelay()
    321       : kWeightFactor(0.5f),
    322         delay_ms_(0),
    323         filtered_delay_ms_per_s_(new VCMExpFilter(kWeightFactor)) {
    324     filtered_delay_ms_per_s_->Apply(1.0f, 0.0f);
    325   }
    326   ~CaptureQueueDelay() {}
    327 
    328   void FrameCaptured(int64_t now) {
    329     const size_t kMaxSize = 200;
    330     if (frames_.size() > kMaxSize) {
    331       frames_.pop_front();
    332     }
    333     frames_.push_back(now);
    334   }
    335 
    336   void FrameProcessingStarted(int64_t now) {
    337     if (frames_.empty()) {
    338       return;
    339     }
    340     delay_ms_ = now - frames_.front();
    341     frames_.pop_front();
    342   }
    343 
    344   void CalculateDelayChange(int64_t diff_last_sample_ms) {
    345     if (diff_last_sample_ms <= 0) {
    346       return;
    347     }
    348     float exp = static_cast<float>(diff_last_sample_ms) / kProcessIntervalMs;
    349     exp = std::min(exp, kMaxExp);
    350     filtered_delay_ms_per_s_->Apply(exp,
    351                                     delay_ms_ * 1000.0f / diff_last_sample_ms);
    352     ClearFrames();
    353   }
    354 
    355   void ClearFrames() {
    356     frames_.clear();
    357   }
    358 
    359   int delay_ms() const {
    360     return delay_ms_;
    361   }
    362 
    363   int Value() const {
    364     return static_cast<int>(filtered_delay_ms_per_s_->Value() + 0.5);
    365   }
    366 
    367  private:
    368   const float kWeightFactor;
    369   std::list<int64_t> frames_;
    370   int delay_ms_;
    371   scoped_ptr<VCMExpFilter> filtered_delay_ms_per_s_;
    372 };
    373 
    374 OveruseFrameDetector::OveruseFrameDetector(Clock* clock)
    375     : crit_(CriticalSectionWrapper::CreateCriticalSection()),
    376       observer_(NULL),
    377       clock_(clock),
    378       next_process_time_(clock_->TimeInMilliseconds()),
    379       num_process_times_(0),
    380       last_capture_time_(0),
    381       last_overuse_time_(0),
    382       checks_above_threshold_(0),
    383       num_overuse_detections_(0),
    384       last_rampup_time_(0),
    385       in_quick_rampup_(false),
    386       current_rampup_delay_ms_(kStandardRampUpDelayMs),
    387       num_pixels_(0),
    388       last_encode_sample_ms_(0),
    389       encode_time_(new EncodeTimeAvg()),
    390       encode_rsd_(new EncodeTimeRsd(clock)),
    391       encode_usage_(new EncodeUsage()),
    392       capture_queue_delay_(new CaptureQueueDelay()) {
    393 }
    394 
    395 OveruseFrameDetector::~OveruseFrameDetector() {
    396 }
    397 
    398 void OveruseFrameDetector::SetObserver(CpuOveruseObserver* observer) {
    399   CriticalSectionScoped cs(crit_.get());
    400   observer_ = observer;
    401 }
    402 
    403 void OveruseFrameDetector::SetOptions(const CpuOveruseOptions& options) {
    404   assert(options.min_frame_samples > 0);
    405   CriticalSectionScoped cs(crit_.get());
    406   if (options_.Equals(options)) {
    407     return;
    408   }
    409   options_ = options;
    410   capture_deltas_.SetOptions(options);
    411   encode_usage_->SetOptions(options);
    412   encode_rsd_->SetOptions(options);
    413   ResetAll(num_pixels_);
    414 }
    415 
    416 int OveruseFrameDetector::CaptureQueueDelayMsPerS() const {
    417   CriticalSectionScoped cs(crit_.get());
    418   return capture_queue_delay_->delay_ms();
    419 }
    420 
    421 void OveruseFrameDetector::GetCpuOveruseMetrics(
    422     CpuOveruseMetrics* metrics) const {
    423   CriticalSectionScoped cs(crit_.get());
    424   metrics->capture_jitter_ms = static_cast<int>(capture_deltas_.StdDev() + 0.5);
    425   metrics->avg_encode_time_ms = encode_time_->Value();
    426   metrics->encode_rsd = encode_rsd_->Value();
    427   metrics->encode_usage_percent = encode_usage_->Value();
    428   metrics->capture_queue_delay_ms_per_s = capture_queue_delay_->Value();
    429 }
    430 
    431 int32_t OveruseFrameDetector::TimeUntilNextProcess() {
    432   CriticalSectionScoped cs(crit_.get());
    433   return next_process_time_ - clock_->TimeInMilliseconds();
    434 }
    435 
    436 bool OveruseFrameDetector::FrameSizeChanged(int num_pixels) const {
    437   if (num_pixels != num_pixels_) {
    438     return true;
    439   }
    440   return false;
    441 }
    442 
    443 bool OveruseFrameDetector::FrameTimeoutDetected(int64_t now) const {
    444   if (last_capture_time_ == 0) {
    445     return false;
    446   }
    447   return (now - last_capture_time_) > options_.frame_timeout_interval_ms;
    448 }
    449 
    450 void OveruseFrameDetector::ResetAll(int num_pixels) {
    451   num_pixels_ = num_pixels;
    452   capture_deltas_.Reset();
    453   encode_usage_->Reset();
    454   encode_rsd_->Reset();
    455   capture_queue_delay_->ClearFrames();
    456   last_capture_time_ = 0;
    457   num_process_times_ = 0;
    458 }
    459 
    460 void OveruseFrameDetector::FrameCaptured(int width, int height) {
    461   CriticalSectionScoped cs(crit_.get());
    462 
    463   int64_t now = clock_->TimeInMilliseconds();
    464   if (FrameSizeChanged(width * height) || FrameTimeoutDetected(now)) {
    465     ResetAll(width * height);
    466   }
    467 
    468   if (last_capture_time_ != 0) {
    469     capture_deltas_.AddSample(now - last_capture_time_);
    470     encode_usage_->AddSample(now - last_capture_time_);
    471   }
    472   last_capture_time_ = now;
    473 
    474   capture_queue_delay_->FrameCaptured(now);
    475 }
    476 
    477 void OveruseFrameDetector::FrameProcessingStarted() {
    478   CriticalSectionScoped cs(crit_.get());
    479   capture_queue_delay_->FrameProcessingStarted(clock_->TimeInMilliseconds());
    480 }
    481 
    482 void OveruseFrameDetector::FrameEncoded(int encode_time_ms) {
    483   CriticalSectionScoped cs(crit_.get());
    484   int64_t time = clock_->TimeInMilliseconds();
    485   if (last_encode_sample_ms_ != 0) {
    486     int64_t diff_ms = time - last_encode_sample_ms_;
    487     encode_time_->AddEncodeSample(encode_time_ms, diff_ms);
    488     encode_usage_->AddEncodeSample(encode_time_ms, diff_ms);
    489     encode_rsd_->AddEncodeSample(encode_time_ms);
    490   }
    491   last_encode_sample_ms_ = time;
    492 }
    493 
    494 int32_t OveruseFrameDetector::Process() {
    495   CriticalSectionScoped cs(crit_.get());
    496 
    497   int64_t now = clock_->TimeInMilliseconds();
    498 
    499   // Used to protect against Process() being called too often.
    500   if (now < next_process_time_)
    501     return 0;
    502 
    503   int64_t diff_ms = now - next_process_time_ + kProcessIntervalMs;
    504   next_process_time_ = now + kProcessIntervalMs;
    505   ++num_process_times_;
    506 
    507   encode_rsd_->Process(now);
    508   capture_queue_delay_->CalculateDelayChange(diff_ms);
    509 
    510   if (num_process_times_ <= options_.min_process_count) {
    511     return 0;
    512   }
    513 
    514   if (IsOverusing()) {
    515     // If the last thing we did was going up, and now have to back down, we need
    516     // to check if this peak was short. If so we should back off to avoid going
    517     // back and forth between this load, the system doesn't seem to handle it.
    518     bool check_for_backoff = last_rampup_time_ > last_overuse_time_;
    519     if (check_for_backoff) {
    520       if (now - last_rampup_time_ < kStandardRampUpDelayMs ||
    521           num_overuse_detections_ > kMaxOverusesBeforeApplyRampupDelay) {
    522         // Going up was not ok for very long, back off.
    523         current_rampup_delay_ms_ *= kRampUpBackoffFactor;
    524         if (current_rampup_delay_ms_ > kMaxRampUpDelayMs)
    525           current_rampup_delay_ms_ = kMaxRampUpDelayMs;
    526       } else {
    527         // Not currently backing off, reset rampup delay.
    528         current_rampup_delay_ms_ = kStandardRampUpDelayMs;
    529       }
    530     }
    531 
    532     last_overuse_time_ = now;
    533     in_quick_rampup_ = false;
    534     checks_above_threshold_ = 0;
    535     ++num_overuse_detections_;
    536 
    537     if (observer_ != NULL)
    538       observer_->OveruseDetected();
    539   } else if (IsUnderusing(now)) {
    540     last_rampup_time_ = now;
    541     in_quick_rampup_ = true;
    542 
    543     if (observer_ != NULL)
    544       observer_->NormalUsage();
    545   }
    546 
    547   int rampup_delay =
    548       in_quick_rampup_ ? kQuickRampUpDelayMs : current_rampup_delay_ms_;
    549   LOG(LS_VERBOSE) << " Frame stats: capture avg: " << capture_deltas_.Mean()
    550                   << " capture stddev " << capture_deltas_.StdDev()
    551                   << " encode usage " << encode_usage_->Value()
    552                   << " encode rsd " << encode_rsd_->Value()
    553                   << " overuse detections " << num_overuse_detections_
    554                   << " rampup delay " << rampup_delay;
    555   return 0;
    556 }
    557 
    558 bool OveruseFrameDetector::IsOverusing() {
    559   bool overusing = false;
    560   if (options_.enable_capture_jitter_method) {
    561     overusing = capture_deltas_.StdDev() >=
    562         options_.high_capture_jitter_threshold_ms;
    563   } else if (options_.enable_encode_usage_method) {
    564     bool encode_usage_overuse =
    565         encode_usage_->Value() >= options_.high_encode_usage_threshold_percent;
    566     bool encode_rsd_overuse = false;
    567     if (options_.high_encode_time_rsd_threshold > 0) {
    568       encode_rsd_overuse =
    569           (encode_rsd_->Value() >= options_.high_encode_time_rsd_threshold);
    570     }
    571     overusing = encode_usage_overuse || encode_rsd_overuse;
    572   }
    573 
    574   if (overusing) {
    575     ++checks_above_threshold_;
    576   } else {
    577     checks_above_threshold_ = 0;
    578   }
    579   return checks_above_threshold_ >= options_.high_threshold_consecutive_count;
    580 }
    581 
    582 bool OveruseFrameDetector::IsUnderusing(int64_t time_now) {
    583   int delay = in_quick_rampup_ ? kQuickRampUpDelayMs : current_rampup_delay_ms_;
    584   if (time_now < last_rampup_time_ + delay)
    585     return false;
    586 
    587   bool underusing = false;
    588   if (options_.enable_capture_jitter_method) {
    589     underusing = capture_deltas_.StdDev() <
    590         options_.low_capture_jitter_threshold_ms;
    591   } else if (options_.enable_encode_usage_method) {
    592     bool encode_usage_underuse =
    593         encode_usage_->Value() < options_.low_encode_usage_threshold_percent;
    594     bool encode_rsd_underuse = true;
    595     if (options_.low_encode_time_rsd_threshold > 0) {
    596       encode_rsd_underuse =
    597           (encode_rsd_->Value() < options_.low_encode_time_rsd_threshold);
    598     }
    599     underusing = encode_usage_underuse && encode_rsd_underuse;
    600   }
    601   return underusing;
    602 }
    603 }  // namespace webrtc
    604