1 # Copyright (c) 2009, Google Inc. All rights reserved. 2 # Copyright (c) 2009 Apple Inc. All rights reserved. 3 # 4 # Redistribution and use in source and binary forms, with or without 5 # modification, are permitted provided that the following conditions are 6 # met: 7 # 8 # * Redistributions of source code must retain the above copyright 9 # notice, this list of conditions and the following disclaimer. 10 # * Redistributions in binary form must reproduce the above 11 # copyright notice, this list of conditions and the following disclaimer 12 # in the documentation and/or other materials provided with the 13 # distribution. 14 # * Neither the name of Google Inc. nor the names of its 15 # contributors may be used to endorse or promote products derived from 16 # this software without specific prior written permission. 17 # 18 # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 19 # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 20 # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 21 # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 22 # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 23 # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 24 # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 25 # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 26 # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 27 # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 28 # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 29 30 import errno 31 import logging 32 import multiprocessing 33 import os 34 import StringIO 35 import signal 36 import subprocess 37 import sys 38 import time 39 40 from webkitpy.common.system.outputtee import Tee 41 from webkitpy.common.system.filesystem import FileSystem 42 43 44 _log = logging.getLogger(__name__) 45 46 47 class ScriptError(Exception): 48 49 def __init__(self, 50 message=None, 51 script_args=None, 52 exit_code=None, 53 output=None, 54 cwd=None, 55 output_limit=500): 56 shortened_output = output 57 if output and output_limit and len(output) > output_limit: 58 shortened_output = "Last %s characters of output:\n%s" % (output_limit, output[-output_limit:]) 59 60 if not message: 61 message = 'Failed to run "%s"' % repr(script_args) 62 if exit_code: 63 message += " exit_code: %d" % exit_code 64 if cwd: 65 message += " cwd: %s" % cwd 66 67 if shortened_output: 68 message += "\n\noutput: %s" % shortened_output 69 70 Exception.__init__(self, message) 71 self.script_args = script_args # 'args' is already used by Exception 72 self.exit_code = exit_code 73 self.output = output 74 self.cwd = cwd 75 76 def message_with_output(self): 77 return unicode(self) 78 79 def command_name(self): 80 command_path = self.script_args 81 if type(command_path) is list: 82 command_path = command_path[0] 83 return os.path.basename(command_path) 84 85 86 class Executive(object): 87 PIPE = subprocess.PIPE 88 STDOUT = subprocess.STDOUT 89 90 def _should_close_fds(self): 91 # We need to pass close_fds=True to work around Python bug #2320 92 # (otherwise we can hang when we kill DumpRenderTree when we are running 93 # multiple threads). See http://bugs.python.org/issue2320 . 94 # Note that close_fds isn't supported on Windows, but this bug only 95 # shows up on Mac and Linux. 96 return sys.platform not in ('win32', 'cygwin') 97 98 def _run_command_with_teed_output(self, args, teed_output, **kwargs): 99 child_process = self.popen(args, 100 stdout=self.PIPE, 101 stderr=self.STDOUT, 102 close_fds=self._should_close_fds(), 103 **kwargs) 104 105 # Use our own custom wait loop because Popen ignores a tee'd 106 # stderr/stdout. 107 # FIXME: This could be improved not to flatten output to stdout. 108 while True: 109 output_line = child_process.stdout.readline() 110 if output_line == "" and child_process.poll() != None: 111 # poll() is not threadsafe and can throw OSError due to: 112 # http://bugs.python.org/issue1731717 113 return child_process.poll() 114 # We assume that the child process wrote to us in utf-8, 115 # so no re-encoding is necessary before writing here. 116 teed_output.write(output_line) 117 118 # FIXME: Remove this deprecated method and move callers to run_command. 119 # FIXME: This method is a hack to allow running command which both 120 # capture their output and print out to stdin. Useful for things 121 # like "build-webkit" where we want to display to the user that we're building 122 # but still have the output to stuff into a log file. 123 def run_and_throw_if_fail(self, args, quiet=False, decode_output=True, **kwargs): 124 # Cache the child's output locally so it can be used for error reports. 125 child_out_file = StringIO.StringIO() 126 tee_stdout = sys.stdout 127 if quiet: 128 dev_null = open(os.devnull, "w") # FIXME: Does this need an encoding? 129 tee_stdout = dev_null 130 child_stdout = Tee(child_out_file, tee_stdout) 131 exit_code = self._run_command_with_teed_output(args, child_stdout, **kwargs) 132 if quiet: 133 dev_null.close() 134 135 child_output = child_out_file.getvalue() 136 child_out_file.close() 137 138 if decode_output: 139 child_output = child_output.decode(self._child_process_encoding()) 140 141 if exit_code: 142 raise ScriptError(script_args=args, 143 exit_code=exit_code, 144 output=child_output) 145 return child_output 146 147 def cpu_count(self): 148 return multiprocessing.cpu_count() 149 150 @staticmethod 151 def interpreter_for_script(script_path, fs=None): 152 fs = fs or FileSystem() 153 lines = fs.read_text_file(script_path).splitlines() 154 if not len(lines): 155 return None 156 first_line = lines[0] 157 if not first_line.startswith('#!'): 158 return None 159 if first_line.find('python') > -1: 160 return sys.executable 161 if first_line.find('perl') > -1: 162 return 'perl' 163 if first_line.find('ruby') > -1: 164 return 'ruby' 165 return None 166 167 @staticmethod 168 def shell_command_for_script(script_path, fs=None): 169 fs = fs or FileSystem() 170 # Win32 does not support shebang. We need to detect the interpreter ourself. 171 if sys.platform == 'win32': 172 interpreter = Executive.interpreter_for_script(script_path, fs) 173 if interpreter: 174 return [interpreter, script_path] 175 return [script_path] 176 177 def kill_process(self, pid): 178 """Attempts to kill the given pid. 179 Will fail silently if pid does not exist or insufficient permisssions.""" 180 if sys.platform == "win32": 181 # We only use taskkill.exe on windows (not cygwin) because subprocess.pid 182 # is a CYGWIN pid and taskkill.exe expects a windows pid. 183 # Thankfully os.kill on CYGWIN handles either pid type. 184 command = ["taskkill.exe", "/f", "/pid", pid] 185 # taskkill will exit 128 if the process is not found. We should log. 186 self.run_command(command, error_handler=self.ignore_error) 187 return 188 189 # According to http://docs.python.org/library/os.html 190 # os.kill isn't available on Windows. python 2.5.5 os.kill appears 191 # to work in cygwin, however it occasionally raises EAGAIN. 192 retries_left = 10 if sys.platform == "cygwin" else 1 193 while retries_left > 0: 194 try: 195 retries_left -= 1 196 os.kill(pid, signal.SIGKILL) 197 _ = os.waitpid(pid, os.WNOHANG) 198 except OSError, e: 199 if e.errno == errno.EAGAIN: 200 if retries_left <= 0: 201 _log.warn("Failed to kill pid %s. Too many EAGAIN errors." % pid) 202 continue 203 if e.errno == errno.ESRCH: # The process does not exist. 204 return 205 if e.errno == errno.EPIPE: # The process has exited already on cygwin 206 return 207 if e.errno == errno.ECHILD: 208 # Can't wait on a non-child process, but the kill worked. 209 return 210 if e.errno == errno.EACCES and sys.platform == 'cygwin': 211 # Cygwin python sometimes can't kill native processes. 212 return 213 raise 214 215 def _win32_check_running_pid(self, pid): 216 # importing ctypes at the top-level seems to cause weird crashes at 217 # exit under cygwin on apple's win port. Only win32 needs cygwin, so 218 # we import it here instead. See https://bugs.webkit.org/show_bug.cgi?id=91682 219 import ctypes 220 221 class PROCESSENTRY32(ctypes.Structure): 222 _fields_ = [("dwSize", ctypes.c_ulong), 223 ("cntUsage", ctypes.c_ulong), 224 ("th32ProcessID", ctypes.c_ulong), 225 ("th32DefaultHeapID", ctypes.POINTER(ctypes.c_ulong)), 226 ("th32ModuleID", ctypes.c_ulong), 227 ("cntThreads", ctypes.c_ulong), 228 ("th32ParentProcessID", ctypes.c_ulong), 229 ("pcPriClassBase", ctypes.c_ulong), 230 ("dwFlags", ctypes.c_ulong), 231 ("szExeFile", ctypes.c_char * 260)] 232 233 CreateToolhelp32Snapshot = ctypes.windll.kernel32.CreateToolhelp32Snapshot 234 Process32First = ctypes.windll.kernel32.Process32First 235 Process32Next = ctypes.windll.kernel32.Process32Next 236 CloseHandle = ctypes.windll.kernel32.CloseHandle 237 TH32CS_SNAPPROCESS = 0x00000002 # win32 magic number 238 hProcessSnap = CreateToolhelp32Snapshot(TH32CS_SNAPPROCESS, 0) 239 pe32 = PROCESSENTRY32() 240 pe32.dwSize = ctypes.sizeof(PROCESSENTRY32) 241 result = False 242 if not Process32First(hProcessSnap, ctypes.byref(pe32)): 243 _log.debug("Failed getting first process.") 244 CloseHandle(hProcessSnap) 245 return result 246 while True: 247 if pe32.th32ProcessID == pid: 248 result = True 249 break 250 if not Process32Next(hProcessSnap, ctypes.byref(pe32)): 251 break 252 CloseHandle(hProcessSnap) 253 return result 254 255 def check_running_pid(self, pid): 256 """Return True if pid is alive, otherwise return False.""" 257 if sys.platform == 'win32': 258 return self._win32_check_running_pid(pid) 259 260 try: 261 os.kill(pid, 0) 262 return True 263 except OSError: 264 return False 265 266 def running_pids(self, process_name_filter=None): 267 if not process_name_filter: 268 process_name_filter = lambda process_name: True 269 270 running_pids = [] 271 272 if sys.platform in ("win32", "cygwin"): 273 # FIXME: running_pids isn't implemented on Windows yet... 274 return [] 275 276 ps_process = self.popen(['ps', '-eo', 'pid,comm'], stdout=self.PIPE, stderr=self.PIPE) 277 stdout, _ = ps_process.communicate() 278 for line in stdout.splitlines(): 279 try: 280 # In some cases the line can contain one or more 281 # leading white-spaces, so strip it before split. 282 pid, process_name = line.strip().split(' ', 1) 283 if process_name_filter(process_name): 284 running_pids.append(int(pid)) 285 except ValueError, e: 286 pass 287 288 return sorted(running_pids) 289 290 def wait_newest(self, process_name_filter=None): 291 if not process_name_filter: 292 process_name_filter = lambda process_name: True 293 294 running_pids = self.running_pids(process_name_filter) 295 if not running_pids: 296 return 297 pid = running_pids[-1] 298 299 while self.check_running_pid(pid): 300 time.sleep(0.25) 301 302 def wait_limited(self, pid, limit_in_seconds=None, check_frequency_in_seconds=None): 303 seconds_left = limit_in_seconds or 10 304 sleep_length = check_frequency_in_seconds or 1 305 while seconds_left > 0 and self.check_running_pid(pid): 306 seconds_left -= sleep_length 307 time.sleep(sleep_length) 308 309 def _windows_image_name(self, process_name): 310 name, extension = os.path.splitext(process_name) 311 if not extension: 312 # taskkill expects processes to end in .exe 313 # If necessary we could add a flag to disable appending .exe. 314 process_name = "%s.exe" % name 315 return process_name 316 317 def interrupt(self, pid): 318 interrupt_signal = signal.SIGINT 319 # FIXME: The python docs seem to imply that platform == 'win32' may need to use signal.CTRL_C_EVENT 320 # http://docs.python.org/2/library/signal.html 321 try: 322 os.kill(pid, interrupt_signal) 323 except OSError: 324 # Silently ignore when the pid doesn't exist. 325 # It's impossible for callers to avoid race conditions with process shutdown. 326 pass 327 328 def kill_all(self, process_name): 329 """Attempts to kill processes matching process_name. 330 Will fail silently if no process are found.""" 331 if sys.platform in ("win32", "cygwin"): 332 image_name = self._windows_image_name(process_name) 333 command = ["taskkill.exe", "/f", "/im", image_name] 334 # taskkill will exit 128 if the process is not found. We should log. 335 self.run_command(command, error_handler=self.ignore_error) 336 return 337 338 # FIXME: This is inconsistent that kill_all uses TERM and kill_process 339 # uses KILL. Windows is always using /f (which seems like -KILL). 340 # We should pick one mode, or add support for switching between them. 341 # Note: Mac OS X 10.6 requires -SIGNALNAME before -u USER 342 command = ["killall", "-TERM", "-u", os.getenv("USER"), process_name] 343 # killall returns 1 if no process can be found and 2 on command error. 344 # FIXME: We should pass a custom error_handler to allow only exit_code 1. 345 # We should log in exit_code == 1 346 self.run_command(command, error_handler=self.ignore_error) 347 348 # Error handlers do not need to be static methods once all callers are 349 # updated to use an Executive object. 350 351 @staticmethod 352 def default_error_handler(error): 353 raise error 354 355 @staticmethod 356 def ignore_error(error): 357 pass 358 359 def _compute_stdin(self, input): 360 """Returns (stdin, string_to_communicate)""" 361 # FIXME: We should be returning /dev/null for stdin 362 # or closing stdin after process creation to prevent 363 # child processes from getting input from the user. 364 if not input: 365 return (None, None) 366 if hasattr(input, "read"): # Check if the input is a file. 367 return (input, None) # Assume the file is in the right encoding. 368 369 # Popen in Python 2.5 and before does not automatically encode unicode objects. 370 # http://bugs.python.org/issue5290 371 # See https://bugs.webkit.org/show_bug.cgi?id=37528 372 # for an example of a regresion caused by passing a unicode string directly. 373 # FIXME: We may need to encode differently on different platforms. 374 if isinstance(input, unicode): 375 input = input.encode(self._child_process_encoding()) 376 return (self.PIPE, input) 377 378 def command_for_printing(self, args): 379 """Returns a print-ready string representing command args. 380 The string should be copy/paste ready for execution in a shell.""" 381 args = self._stringify_args(args) 382 escaped_args = [] 383 for arg in args: 384 if isinstance(arg, unicode): 385 # Escape any non-ascii characters for easy copy/paste 386 arg = arg.encode("unicode_escape") 387 # FIXME: Do we need to fix quotes here? 388 escaped_args.append(arg) 389 return " ".join(escaped_args) 390 391 # FIXME: run_and_throw_if_fail should be merged into this method. 392 def run_command(self, 393 args, 394 cwd=None, 395 env=None, 396 input=None, 397 error_handler=None, 398 return_exit_code=False, 399 return_stderr=True, 400 decode_output=True, debug_logging=True): 401 """Popen wrapper for convenience and to work around python bugs.""" 402 assert(isinstance(args, list) or isinstance(args, tuple)) 403 start_time = time.time() 404 405 stdin, string_to_communicate = self._compute_stdin(input) 406 stderr = self.STDOUT if return_stderr else None 407 408 process = self.popen(args, 409 stdin=stdin, 410 stdout=self.PIPE, 411 stderr=stderr, 412 cwd=cwd, 413 env=env, 414 close_fds=self._should_close_fds()) 415 output = process.communicate(string_to_communicate)[0] 416 417 # run_command automatically decodes to unicode() unless explicitly told not to. 418 if decode_output: 419 output = output.decode(self._child_process_encoding()) 420 421 # wait() is not threadsafe and can throw OSError due to: 422 # http://bugs.python.org/issue1731717 423 exit_code = process.wait() 424 425 if debug_logging: 426 _log.debug('"%s" took %.2fs' % (self.command_for_printing(args), time.time() - start_time)) 427 428 if return_exit_code: 429 return exit_code 430 431 if exit_code: 432 script_error = ScriptError(script_args=args, 433 exit_code=exit_code, 434 output=output, 435 cwd=cwd) 436 (error_handler or self.default_error_handler)(script_error) 437 return output 438 439 def _child_process_encoding(self): 440 # Win32 Python 2.x uses CreateProcessA rather than CreateProcessW 441 # to launch subprocesses, so we have to encode arguments using the 442 # current code page. 443 if sys.platform == 'win32' and sys.version < '3': 444 return 'mbcs' 445 # All other platforms use UTF-8. 446 # FIXME: Using UTF-8 on Cygwin will confuse Windows-native commands 447 # which will expect arguments to be encoded using the current code 448 # page. 449 return 'utf-8' 450 451 def _should_encode_child_process_arguments(self): 452 # Cygwin's Python's os.execv doesn't support unicode command 453 # arguments, and neither does Cygwin's execv itself. 454 if sys.platform == 'cygwin': 455 return True 456 457 # Win32 Python 2.x uses CreateProcessA rather than CreateProcessW 458 # to launch subprocesses, so we have to encode arguments using the 459 # current code page. 460 if sys.platform == 'win32' and sys.version < '3': 461 return True 462 463 return False 464 465 def _encode_argument_if_needed(self, argument): 466 if not self._should_encode_child_process_arguments(): 467 return argument 468 return argument.encode(self._child_process_encoding()) 469 470 def _stringify_args(self, args): 471 # Popen will throw an exception if args are non-strings (like int()) 472 string_args = map(unicode, args) 473 # The Windows implementation of Popen cannot handle unicode strings. :( 474 return map(self._encode_argument_if_needed, string_args) 475 476 # The only required arugment to popen is named "args", the rest are optional keyword arguments. 477 def popen(self, args, **kwargs): 478 # FIXME: We should always be stringifying the args, but callers who pass shell=True 479 # expect that the exact bytes passed will get passed to the shell (even if they're wrongly encoded). 480 # shell=True is wrong for many other reasons, and we should remove this 481 # hack as soon as we can fix all callers to not use shell=True. 482 if kwargs.get('shell') == True: 483 string_args = args 484 else: 485 string_args = self._stringify_args(args) 486 return subprocess.Popen(string_args, **kwargs) 487 488 def call(self, args, **kwargs): 489 return subprocess.call(self._stringify_args(args), **kwargs) 490 491 def run_in_parallel(self, command_lines_and_cwds, processes=None): 492 """Runs a list of (cmd_line list, cwd string) tuples in parallel and returns a list of (retcode, stdout, stderr) tuples.""" 493 assert len(command_lines_and_cwds) 494 495 if sys.platform in ('cygwin', 'win32'): 496 return map(_run_command_thunk, command_lines_and_cwds) 497 pool = multiprocessing.Pool(processes=processes) 498 results = pool.map(_run_command_thunk, command_lines_and_cwds) 499 pool.close() 500 pool.join() 501 return results 502 503 504 def _run_command_thunk(cmd_line_and_cwd): 505 # Note that this needs to be a bare module (and hence Picklable) method to work with multiprocessing.Pool. 506 (cmd_line, cwd) = cmd_line_and_cwd 507 proc = subprocess.Popen(cmd_line, cwd=cwd, stdout=subprocess.PIPE, stderr=subprocess.PIPE) 508 stdout, stderr = proc.communicate() 509 return (proc.returncode, stdout, stderr) 510