Home | History | Annotate | Download | only in base
      1 /*
      2  *  Copyright 2010 The WebRTC Project Authors. All rights reserved.
      3  *
      4  *  Use of this source code is governed by a BSD-style license
      5  *  that can be found in the LICENSE file in the root of the source
      6  *  tree. An additional intellectual property rights grant can be found
      7  *  in the file PATENTS.  All contributing project authors may
      8  *  be found in the AUTHORS file in the root of the source tree.
      9  */
     10 
     11 #include "webrtc/base/cpumonitor.h"
     12 
     13 #include <string>
     14 
     15 #include "webrtc/base/common.h"
     16 #include "webrtc/base/logging.h"
     17 #include "webrtc/base/scoped_ptr.h"
     18 #include "webrtc/base/systeminfo.h"
     19 #include "webrtc/base/thread.h"
     20 #include "webrtc/base/timeutils.h"
     21 
     22 #if defined(WEBRTC_WIN)
     23 #include "webrtc/base/win32.h"
     24 #include <winternl.h>
     25 #endif
     26 
     27 #if defined(WEBRTC_POSIX)
     28 #include <sys/time.h>
     29 #endif
     30 
     31 #if defined(WEBRTC_MAC)
     32 #include <mach/mach_host.h>
     33 #include <mach/mach_init.h>
     34 #include <mach/mach_port.h>
     35 #include <mach/host_info.h>
     36 #include <mach/task.h>
     37 #endif  // defined(WEBRTC_MAC)
     38 
     39 #if defined(WEBRTC_LINUX)
     40 #include <sys/resource.h>
     41 #include <errno.h>
     42 #include <stdio.h>
     43 #include "webrtc/base/fileutils.h"
     44 #include "webrtc/base/pathutils.h"
     45 #endif // defined(WEBRTC_LINUX)
     46 
     47 #if defined(WEBRTC_MAC)
     48 static uint64 TimeValueTToInt64(const time_value_t &time_value) {
     49   return rtc::kNumMicrosecsPerSec * time_value.seconds +
     50       time_value.microseconds;
     51 }
     52 #endif  // defined(WEBRTC_MAC)
     53 
     54 // How CpuSampler works
     55 // When threads switch, the time they spent is accumulated to system counters.
     56 // The time can be treated as user, kernel or idle.
     57 // user time is applications.
     58 // kernel time is the OS, including the thread switching code itself.
     59 //   typically kernel time indicates IO.
     60 // idle time is a process that wastes time when nothing is ready to run.
     61 //
     62 // User time is broken down by process (application).  One of the applications
     63 // is the current process.  When you add up all application times, this is
     64 // system time.  If only your application is running, system time should be the
     65 // same as process time.
     66 //
     67 // All cores contribute to these accumulators.  A dual core process is able to
     68 // process twice as many cycles as a single core.  The actual code efficiency
     69 // may be worse, due to contention, but the available cycles is exactly twice
     70 // as many, and the cpu load will reflect the efficiency.  Hyperthreads behave
     71 // the same way.  The load will reflect 200%, but the actual amount of work
     72 // completed will be much less than a true dual core.
     73 //
     74 // Total available performance is the sum of all accumulators.
     75 // If you tracked this for 1 second, it would essentially give you the clock
     76 // rate - number of cycles per second.
// Speed step / Turbo Boost is not considered, so in fact more processing time
// may be available.
     79 
     80 namespace rtc {
     81 
// Default minimum interval, in milliseconds, between two load recomputations
// (used to initialize CpuSampler::min_load_interval_).
// Note: tests on Windows show 600 ms is the minimum stable interval for
// Windows 7.
static const int32 kDefaultInterval = 950;  // Slightly under 1 second.
     84 
     85 CpuSampler::CpuSampler()
     86     : min_load_interval_(kDefaultInterval)
     87 #if defined(WEBRTC_WIN)
     88       , get_system_times_(NULL),
     89       nt_query_system_information_(NULL),
     90       force_fallback_(false)
     91 #endif
     92     {
     93 }
     94 
     95 CpuSampler::~CpuSampler() {
     96 }
     97 
     98 // Set minimum interval in ms between computing new load values. Default 950.
     99 void CpuSampler::set_load_interval(int min_load_interval) {
    100   min_load_interval_ = min_load_interval;
    101 }
    102 
    103 bool CpuSampler::Init() {
    104   sysinfo_.reset(new SystemInfo);
    105   cpus_ = sysinfo_->GetMaxCpus();
    106   if (cpus_ == 0) {
    107     return false;
    108   }
    109 #if defined(WEBRTC_WIN)
    110   // Note that GetSystemTimes is available in Windows XP SP1 or later.
    111   // http://msdn.microsoft.com/en-us/library/ms724400.aspx
    112   // NtQuerySystemInformation is used as a fallback.
    113   if (!force_fallback_) {
    114     get_system_times_ = GetProcAddress(GetModuleHandle(L"kernel32.dll"),
    115         "GetSystemTimes");
    116   }
    117   nt_query_system_information_ = GetProcAddress(GetModuleHandle(L"ntdll.dll"),
    118       "NtQuerySystemInformation");
    119   if ((get_system_times_ == NULL) && (nt_query_system_information_ == NULL)) {
    120     return false;
    121   }
    122 #endif
    123 #if defined(WEBRTC_LINUX)
    124   Pathname sname("/proc/stat");
    125   sfile_.reset(Filesystem::OpenFile(sname, "rb"));
    126   if (!sfile_) {
    127     LOG_ERR(LS_ERROR) << "open proc/stat failed:";
    128     return false;
    129   }
    130   if (!sfile_->DisableBuffering()) {
    131     LOG_ERR(LS_ERROR) << "could not disable buffering for proc/stat";
    132     return false;
    133   }
    134 #endif // defined(WEBRTC_LINUX)
    135   GetProcessLoad();  // Initialize values.
    136   GetSystemLoad();
    137   // Help next user call return valid data by recomputing load.
    138   process_.prev_load_time_ = 0u;
    139   system_.prev_load_time_ = 0u;
    140   return true;
    141 }
    142 
    143 float CpuSampler::UpdateCpuLoad(uint64 current_total_times,
    144                                 uint64 current_cpu_times,
    145                                 uint64 *prev_total_times,
    146                                 uint64 *prev_cpu_times) {
    147   float result = 0.f;
    148   if (current_total_times < *prev_total_times ||
    149       current_cpu_times < *prev_cpu_times) {
    150     LOG(LS_ERROR) << "Inconsistent time values are passed. ignored";
    151   } else {
    152     const uint64 cpu_diff = current_cpu_times - *prev_cpu_times;
    153     const uint64 total_diff = current_total_times - *prev_total_times;
    154     result = (total_diff == 0ULL ? 0.f :
    155               static_cast<float>(1.0f * cpu_diff / total_diff));
    156     if (result > static_cast<float>(cpus_)) {
    157       result = static_cast<float>(cpus_);
    158     }
    159     *prev_total_times = current_total_times;
    160     *prev_cpu_times = current_cpu_times;
    161   }
    162   return result;
    163 }
    164 
    165 float CpuSampler::GetSystemLoad() {
    166   uint32 timenow = Time();
    167   int elapsed = static_cast<int>(TimeDiff(timenow, system_.prev_load_time_));
    168   if (min_load_interval_ != 0 && system_.prev_load_time_ != 0u &&
    169       elapsed < min_load_interval_) {
    170     return system_.prev_load_;
    171   }
    172 #if defined(WEBRTC_WIN)
    173   uint64 total_times, cpu_times;
    174 
    175   typedef BOOL (_stdcall *GST_PROC)(LPFILETIME, LPFILETIME, LPFILETIME);
    176   typedef NTSTATUS (WINAPI *QSI_PROC)(SYSTEM_INFORMATION_CLASS,
    177       PVOID, ULONG, PULONG);
    178 
    179   GST_PROC get_system_times = reinterpret_cast<GST_PROC>(get_system_times_);
    180   QSI_PROC nt_query_system_information = reinterpret_cast<QSI_PROC>(
    181       nt_query_system_information_);
    182 
    183   if (get_system_times) {
    184     FILETIME idle_time, kernel_time, user_time;
    185     if (!get_system_times(&idle_time, &kernel_time, &user_time)) {
    186       LOG(LS_ERROR) << "::GetSystemTimes() failed: " << ::GetLastError();
    187       return 0.f;
    188     }
    189     // kernel_time includes Kernel idle time, so no need to
    190     // include cpu_time as total_times
    191     total_times = ToUInt64(kernel_time) + ToUInt64(user_time);
    192     cpu_times = total_times - ToUInt64(idle_time);
    193 
    194   } else {
    195     if (nt_query_system_information) {
    196       ULONG returned_length = 0;
    197       scoped_ptr<SYSTEM_PROCESSOR_PERFORMANCE_INFORMATION[]> processor_info(
    198           new SYSTEM_PROCESSOR_PERFORMANCE_INFORMATION[cpus_]);
    199       nt_query_system_information(
    200           ::SystemProcessorPerformanceInformation,
    201           reinterpret_cast<void*>(processor_info.get()),
    202           cpus_ * sizeof(SYSTEM_PROCESSOR_PERFORMANCE_INFORMATION),
    203           &returned_length);
    204 
    205       if (returned_length !=
    206           (cpus_ * sizeof(SYSTEM_PROCESSOR_PERFORMANCE_INFORMATION))) {
    207         LOG(LS_ERROR) << "NtQuerySystemInformation has unexpected size";
    208         return 0.f;
    209       }
    210 
    211       uint64 current_idle = 0;
    212       uint64 current_kernel = 0;
    213       uint64 current_user = 0;
    214       for (int ix = 0; ix < cpus_; ++ix) {
    215         current_idle += processor_info[ix].IdleTime.QuadPart;
    216         current_kernel += processor_info[ix].UserTime.QuadPart;
    217         current_user += processor_info[ix].KernelTime.QuadPart;
    218       }
    219       total_times = current_kernel + current_user;
    220       cpu_times = total_times - current_idle;
    221     } else {
    222       return 0.f;
    223     }
    224   }
    225 #endif  // WEBRTC_WIN
    226 
    227 #if defined(WEBRTC_MAC)
    228   mach_port_t mach_host = mach_host_self();
    229   host_cpu_load_info_data_t cpu_info;
    230   mach_msg_type_number_t info_count = HOST_CPU_LOAD_INFO_COUNT;
    231   kern_return_t kr = host_statistics(mach_host, HOST_CPU_LOAD_INFO,
    232                                      reinterpret_cast<host_info_t>(&cpu_info),
    233                                      &info_count);
    234   mach_port_deallocate(mach_task_self(), mach_host);
    235   if (KERN_SUCCESS != kr) {
    236     LOG(LS_ERROR) << "::host_statistics() failed";
    237     return 0.f;
    238   }
    239 
    240   const uint64 cpu_times = cpu_info.cpu_ticks[CPU_STATE_NICE] +
    241       cpu_info.cpu_ticks[CPU_STATE_SYSTEM] +
    242       cpu_info.cpu_ticks[CPU_STATE_USER];
    243   const uint64 total_times = cpu_times + cpu_info.cpu_ticks[CPU_STATE_IDLE];
    244 #endif  // defined(WEBRTC_MAC)
    245 
    246 #if defined(WEBRTC_LINUX)
    247   if (!sfile_) {
    248     LOG(LS_ERROR) << "Invalid handle for proc/stat";
    249     return 0.f;
    250   }
    251   std::string statbuf;
    252   sfile_->SetPosition(0);
    253   if (!sfile_->ReadLine(&statbuf)) {
    254     LOG_ERR(LS_ERROR) << "Could not read proc/stat file";
    255     return 0.f;
    256   }
    257 
    258   unsigned long long user;
    259   unsigned long long nice;
    260   unsigned long long system;
    261   unsigned long long idle;
    262   if (sscanf(statbuf.c_str(), "cpu %Lu %Lu %Lu %Lu",
    263              &user, &nice,
    264              &system, &idle) != 4) {
    265     LOG_ERR(LS_ERROR) << "Could not parse cpu info";
    266     return 0.f;
    267   }
    268   const uint64 cpu_times = nice + system + user;
    269   const uint64 total_times = cpu_times + idle;
    270 #endif  // defined(WEBRTC_LINUX)
    271 
    272 #if defined(__native_client__)
    273   // TODO(ryanpetrie): Implement this via PPAPI when it's available.
    274   const uint64 cpu_times = 0;
    275   const uint64 total_times = 0;
    276 #endif  // defined(__native_client__)
    277 
    278   system_.prev_load_time_ = timenow;
    279   system_.prev_load_ = UpdateCpuLoad(total_times,
    280                                      cpu_times * cpus_,
    281                                      &system_.prev_total_times_,
    282                                      &system_.prev_cpu_times_);
    283   return system_.prev_load_;
    284 }
    285 
    286 float CpuSampler::GetProcessLoad() {
    287   uint32 timenow = Time();
    288   int elapsed = static_cast<int>(TimeDiff(timenow, process_.prev_load_time_));
    289   if (min_load_interval_ != 0 && process_.prev_load_time_ != 0u &&
    290       elapsed < min_load_interval_) {
    291     return process_.prev_load_;
    292   }
    293 #if defined(WEBRTC_WIN)
    294   FILETIME current_file_time;
    295   ::GetSystemTimeAsFileTime(&current_file_time);
    296 
    297   FILETIME create_time, exit_time, kernel_time, user_time;
    298   if (!::GetProcessTimes(::GetCurrentProcess(),
    299                          &create_time, &exit_time, &kernel_time, &user_time)) {
    300     LOG(LS_ERROR) << "::GetProcessTimes() failed: " << ::GetLastError();
    301     return 0.f;
    302   }
    303 
    304   const uint64 total_times =
    305       ToUInt64(current_file_time) - ToUInt64(create_time);
    306   const uint64 cpu_times =
    307       (ToUInt64(kernel_time) + ToUInt64(user_time));
    308 #endif  // WEBRTC_WIN
    309 
    310 #if defined(WEBRTC_POSIX)
    311   // Common to both OSX and Linux.
    312   struct timeval tv;
    313   gettimeofday(&tv, NULL);
    314   const uint64 total_times = tv.tv_sec * kNumMicrosecsPerSec + tv.tv_usec;
    315 #endif
    316 
    317 #if defined(WEBRTC_MAC)
    318   // Get live thread usage.
    319   task_thread_times_info task_times_info;
    320   mach_msg_type_number_t info_count = TASK_THREAD_TIMES_INFO_COUNT;
    321 
    322   if (KERN_SUCCESS != task_info(mach_task_self(), TASK_THREAD_TIMES_INFO,
    323                                 reinterpret_cast<task_info_t>(&task_times_info),
    324                                 &info_count)) {
    325     LOG(LS_ERROR) << "::task_info(TASK_THREAD_TIMES_INFO) failed";
    326     return 0.f;
    327   }
    328 
    329   // Get terminated thread usage.
    330   task_basic_info task_term_info;
    331   info_count = TASK_BASIC_INFO_COUNT;
    332   if (KERN_SUCCESS != task_info(mach_task_self(), TASK_BASIC_INFO,
    333                                 reinterpret_cast<task_info_t>(&task_term_info),
    334                                 &info_count)) {
    335     LOG(LS_ERROR) << "::task_info(TASK_BASIC_INFO) failed";
    336     return 0.f;
    337   }
    338 
    339   const uint64 cpu_times = (TimeValueTToInt64(task_times_info.user_time) +
    340       TimeValueTToInt64(task_times_info.system_time) +
    341       TimeValueTToInt64(task_term_info.user_time) +
    342       TimeValueTToInt64(task_term_info.system_time));
    343 #endif  // defined(WEBRTC_MAC)
    344 
    345 #if defined(WEBRTC_LINUX)
    346   rusage usage;
    347   if (getrusage(RUSAGE_SELF, &usage) < 0) {
    348     LOG_ERR(LS_ERROR) << "getrusage failed";
    349     return 0.f;
    350   }
    351 
    352   const uint64 cpu_times =
    353       (usage.ru_utime.tv_sec + usage.ru_stime.tv_sec) * kNumMicrosecsPerSec +
    354       usage.ru_utime.tv_usec + usage.ru_stime.tv_usec;
    355 #endif  // defined(WEBRTC_LINUX)
    356 
    357 #if defined(__native_client__)
    358   // TODO(ryanpetrie): Implement this via PPAPI when it's available.
    359   const uint64 cpu_times = 0;
    360 #endif  // defined(__native_client__)
    361 
    362   process_.prev_load_time_ = timenow;
    363   process_.prev_load_ = UpdateCpuLoad(total_times,
    364                                      cpu_times,
    365                                      &process_.prev_total_times_,
    366                                      &process_.prev_cpu_times_);
    367   return process_.prev_load_;
    368 }
    369 
    370 int CpuSampler::GetMaxCpus() const {
    371   return cpus_;
    372 }
    373 
    374 int CpuSampler::GetCurrentCpus() {
    375   return sysinfo_->GetCurCpus();
    376 }
    377 
    378 ///////////////////////////////////////////////////////////////////
    379 // Implementation of class CpuMonitor.
    380 CpuMonitor::CpuMonitor(Thread* thread)
    381     : monitor_thread_(thread) {
    382 }
    383 
    384 CpuMonitor::~CpuMonitor() {
    385   Stop();
    386 }
    387 
    388 void CpuMonitor::set_thread(Thread* thread) {
    389   ASSERT(monitor_thread_ == NULL || monitor_thread_ == thread);
    390   monitor_thread_ = thread;
    391 }
    392 
    393 bool CpuMonitor::Start(int period_ms) {
    394   if (!monitor_thread_  || !sampler_.Init()) return false;
    395 
    396   monitor_thread_->SignalQueueDestroyed.connect(
    397        this, &CpuMonitor::OnMessageQueueDestroyed);
    398 
    399   period_ms_ = period_ms;
    400   monitor_thread_->PostDelayed(period_ms_, this);
    401 
    402   return true;
    403 }
    404 
    405 void CpuMonitor::Stop() {
    406   if (monitor_thread_) {
    407     monitor_thread_->Clear(this);
    408   }
    409 }
    410 
    411 void CpuMonitor::OnMessage(Message* msg) {
    412   int max_cpus = sampler_.GetMaxCpus();
    413   int current_cpus = sampler_.GetCurrentCpus();
    414   float process_load = sampler_.GetProcessLoad();
    415   float system_load = sampler_.GetSystemLoad();
    416   SignalUpdate(current_cpus, max_cpus, process_load, system_load);
    417 
    418   if (monitor_thread_) {
    419     monitor_thread_->PostDelayed(period_ms_, this);
    420   }
    421 }
    422 
    423 }  // namespace rtc
    424