Home | History | Annotate | Download | only in commands
      1 # Copyright (c) 2011 The Chromium Authors. All rights reserved.
      2 # Use of this source code is governed by a BSD-style license that can be
      3 # found in the LICENSE file.
      4 
      5 """Command for scraping images from a URL or list of URLs.
      6 
      7 Prerequisites:
      8   1. The command_line package from tools/site_compare
      9   2. Either the IE BHO or Firefox extension (or both)
     10 
     11 Installation:
     12   1. Build the IE BHO, or call regsvr32 on a prebuilt binary
     13   2. Add a file called "measurepageloadtimeextension@google.com" to
     14      the default Firefox profile directory under extensions, containing
     15      the path to the Firefox extension root
     16 
     17 Invoke with the command line arguments as documented within
     18 the command line.
     19 """
     20 
     21 import command_line
     22 
     23 from drivers import windowing
     24 from utils import browser_iterate
     25 
     26 def CreateCommand(cmdline):
     27   """Inserts the command and arguments into a command line for parsing."""
     28   cmd = cmdline.AddCommand(
     29     ["scrape"],
     30     "Scrapes an image from a URL or series of URLs.",
     31     None,
     32     ExecuteScrape)
     33 
     34   browser_iterate.SetupIterationCommandLine(cmd)
     35   cmd.AddArgument(
     36     ["-log", "--logfile"], "File to write text output", type="string")
     37   cmd.AddArgument(
     38     ["-out", "--outdir"], "Directory to store scrapes", type="string", required=True)
     39 
     40 
     41 def ExecuteScrape(command):
     42   """Executes the Scrape command."""
     43 
     44   def ScrapeResult(url, proc, wnd, result):
     45     """Capture and save the scrape."""
     46     if log_file: log_file.write(result)
     47 
     48     # Scrape the page
     49     image = windowing.ScrapeWindow(wnd)
     50     filename = windowing.URLtoFilename(url, command["--outdir"], ".bmp")
     51     image.save(filename)
     52 
     53   if command["--logfile"]: log_file = open(command["--logfile"], "w")
     54   else: log_file = None
     55 
     56   browser_iterate.Iterate(command, ScrapeResult)
     57 
     58   # Close the log file and return. We're done.
     59   if log_file: log_file.close()
     60