1 // Copyright 2013 The Chromium Authors. All rights reserved. 2 // Use of this source code is governed by a BSD-style license that can be 3 // found in the LICENSE file. 4 5 #ifndef CHROME_BROWSER_EXTENSIONS_ACTIVITY_LOG_ACTIVITY_LOG_POLICY_H_ 6 #define CHROME_BROWSER_EXTENSIONS_ACTIVITY_LOG_ACTIVITY_LOG_POLICY_H_ 7 8 #include <map> 9 #include <set> 10 #include <string> 11 #include <vector> 12 13 #include "base/bind.h" 14 #include "base/bind_helpers.h" 15 #include "base/callback.h" 16 #include "base/memory/scoped_ptr.h" 17 #include "base/values.h" 18 #include "chrome/browser/extensions/activity_log/activity_actions.h" 19 #include "chrome/browser/extensions/activity_log/activity_database.h" 20 #include "chrome/common/extensions/api/activity_log_private.h" 21 #include "content/public/browser/browser_thread.h" 22 #include "url/gurl.h" 23 24 class Profile; 25 class GURL; 26 27 namespace base { 28 class FilePath; 29 } 30 31 namespace extensions { 32 33 class Extension; 34 35 // An abstract class for processing and summarizing activity log data. 36 // Subclasses will generally store data in an SQLite database (the 37 // ActivityLogDatabasePolicy subclass includes some helper methods to assist 38 // with this case), but this is not absolutely required. 39 // 40 // Implementations should support: 41 // (1) Receiving Actions to process, and summarizing, compression, and storing 42 // these as appropriate. 43 // (2) Reading Actions back from storage. 44 // (3) Cleaning of URLs 45 // 46 // Implementations based on a database should likely implement 47 // ActivityDatabase::Delegate, which provides hooks on database events and 48 // allows the database to periodically request that actions (which the policy 49 // is responsible for queueing) be flushed to storage. 50 // 51 // Since every policy implementation might summarize data differently, the 52 // database implementation is policy-specific and therefore completely 53 // encapsulated in the policy class. All the member functions can be called 54 // on the UI thread. 55 class ActivityLogPolicy { 56 public: 57 enum PolicyType { 58 POLICY_FULLSTREAM, 59 POLICY_COUNTS, 60 POLICY_INVALID, 61 }; 62 63 // Parameters are the profile and the thread that will be used to execute 64 // the callback when ReadData is called. 65 // TODO(felt,dbabic) Since only ReadData uses thread_id, it would be 66 // cleaner to pass thread_id as a param of ReadData directly. 67 explicit ActivityLogPolicy(Profile* profile); 68 69 // Instead of a public destructor, ActivityLogPolicy objects have a Close() 70 // method which will cause the object to be deleted (but may do so on another 71 // thread or in a deferred fashion). 72 virtual void Close() = 0; 73 74 // Updates the internal state of the model summarizing actions and possibly 75 // writes to the database. Implements the default policy storing internal 76 // state to memory every 5 min. 77 virtual void ProcessAction(scoped_refptr<Action> action) = 0; 78 79 // For unit testing only. 80 void SetClockForTesting(scoped_ptr<base::Clock> clock); 81 82 // A collection of methods that are useful for implementing policies. These 83 // are all static methods; the ActivityLogPolicy::Util class cannot be 84 // instantiated. This is nested within ActivityLogPolicy to make calling 85 // these methods more convenient from within a policy, but they are public. 86 class Util { 87 public: 88 // A collection of API calls, used to specify whitelists for argument 89 // filtering. 90 typedef std::set<std::pair<Action::ActionType, std::string> > ApiSet; 91 92 // Serialize a Value as a JSON string. Returns an empty string if value is 93 // null. 94 static std::string Serialize(const base::Value* value); 95 96 // Removes potentially privacy-sensitive data that should not be logged. 97 // This should generally be called on an Action before logging, unless 98 // debugging flags are enabled. Modifies the Action object in place; if 99 // the action might be shared with other users, it is up to the caller to 100 // call ->Clone() first. 101 static void StripPrivacySensitiveFields(scoped_refptr<Action> action); 102 103 // Strip arguments from most API actions, preserving actions only for a 104 // whitelisted set. Modifies the Action object in-place. 105 static void StripArguments(const ApiSet& api_whitelist, 106 scoped_refptr<Action> action); 107 108 // Given a base day (timestamp at local midnight), computes the timestamp 109 // at midnight the given number of days before or after. 110 static base::Time AddDays(const base::Time& base_date, int days); 111 112 // Compute the time bounds that should be used for a database query to 113 // cover a time range days_ago days in the past, relative to the specified 114 // time. 115 static void ComputeDatabaseTimeBounds(const base::Time& now, 116 int days_ago, 117 int64* early_bound, 118 int64* late_bound); 119 120 // Deletes obsolete database tables from an activity log database. This 121 // can be used in InitDatabase() methods of ActivityLogDatabasePolicy 122 // subclasses to clean up data from old versions of the activity logging 123 // code. Returns true on success, false on database error. 124 static bool DropObsoleteTables(sql::Connection* db); 125 126 private: 127 DISALLOW_IMPLICIT_CONSTRUCTORS(Util); 128 }; 129 130 protected: 131 // An ActivityLogPolicy is not directly destroyed. Instead, call Close() 132 // which will cause the object to be deleted when it is safe. 133 virtual ~ActivityLogPolicy(); 134 135 // Returns Time::Now() unless a mock clock has been installed with 136 // SetClockForTesting, in which case the time according to that clock is used 137 // instead. 138 base::Time Now() const; 139 140 private: 141 // Support for a mock clock for testing purposes. This is used by ReadData 142 // to determine the date for "today" when when interpreting date ranges to 143 // fetch. This has no effect on batching of writes to the database. 144 scoped_ptr<base::Clock> testing_clock_; 145 146 DISALLOW_COPY_AND_ASSIGN(ActivityLogPolicy); 147 }; 148 149 // A subclass of ActivityLogPolicy which is designed for policies that use 150 // database storage; it contains several useful helper methods. 151 class ActivityLogDatabasePolicy : public ActivityLogPolicy, 152 public ActivityDatabase::Delegate { 153 public: 154 ActivityLogDatabasePolicy(Profile* profile, 155 const base::FilePath& database_name); 156 157 // Initializes an activity log policy database. This needs to be called after 158 // constructing ActivityLogDatabasePolicy. 159 void Init(); 160 161 // Requests that in-memory state be written to the database. This method can 162 // be called from any thread, but the database writes happen asynchronously 163 // on the database thread. 164 virtual void Flush(); 165 166 // Gets all actions that match the specified fields. URLs are treated like 167 // prefixes; other fields are exact matches. Empty strings are not matched to 168 // anything. For the date: 0 = today, 1 = yesterday, etc.; if the data is 169 // negative, it will be treated as missing. 170 virtual void ReadFilteredData( 171 const std::string& extension_id, 172 const Action::ActionType type, 173 const std::string& api_name, 174 const std::string& page_url, 175 const std::string& arg_url, 176 const int days_ago, 177 const base::Callback 178 <void(scoped_ptr<Action::ActionVector>)>& callback) = 0; 179 180 // Clean the relevant URL data. The cleaning may need to be different for 181 // different policies. If restrict_urls is empty then all URLs are removed. 182 virtual void RemoveURLs(const std::vector<GURL>& restrict_urls) = 0; 183 184 // Remove all rows relating to a given extension. 185 virtual void RemoveExtensionData(const std::string& extension_id) = 0; 186 187 // Deletes everything in the database. 188 virtual void DeleteDatabase() = 0; 189 190 protected: 191 // The Schedule methods dispatch the calls to the database on a 192 // separate thread. 193 template<typename DatabaseType, typename DatabaseFunc> 194 void ScheduleAndForget(DatabaseType db, DatabaseFunc func) { 195 content::BrowserThread::PostTask( 196 content::BrowserThread::DB, 197 FROM_HERE, 198 base::Bind(func, base::Unretained(db))); 199 } 200 201 template<typename DatabaseType, typename DatabaseFunc, typename ArgA> 202 void ScheduleAndForget(DatabaseType db, DatabaseFunc func, ArgA a) { 203 content::BrowserThread::PostTask( 204 content::BrowserThread::DB, 205 FROM_HERE, 206 base::Bind(func, base::Unretained(db), a)); 207 } 208 209 template<typename DatabaseType, typename DatabaseFunc, 210 typename ArgA, typename ArgB> 211 void ScheduleAndForget(DatabaseType db, DatabaseFunc func, ArgA a, ArgB b) { 212 content::BrowserThread::PostTask( 213 content::BrowserThread::DB, 214 FROM_HERE, 215 base::Bind(func, base::Unretained(db), a, b)); 216 } 217 218 // Access to the underlying ActivityDatabase. 219 ActivityDatabase* activity_database() const { return db_; } 220 221 // Access to the SQL connection in the ActivityDatabase. This should only be 222 // called from the database thread. May return NULL if the database is not 223 // valid. 224 sql::Connection* GetDatabaseConnection() const; 225 226 private: 227 // See the comments for the ActivityDatabase class for a discussion of how 228 // database cleanup runs. 229 ActivityDatabase* db_; 230 base::FilePath database_path_; 231 }; 232 233 } // namespace extensions 234 235 #endif // CHROME_BROWSER_EXTENSIONS_ACTIVITY_LOG_ACTIVITY_LOG_POLICY_H_ 236