1 # Copyright 2016 The Chromium OS Authors. All rights reserved. 2 # Use of this source code is governed by a BSD-style license that can be 3 # found in the LICENSE file. 4 5 """This module provides the utilities for avsync_probe's data processing. 6 7 We will get a lot of raw data from the avsync_probe.Capture(). One data per 8 millisecond. 9 AVSyncProbeDataParser will help to transform the raw data to more readable 10 formats. It also helps to calculate the audio/video sync timing if the 11 sound_interval_frames parameter is not None. 12 13 Example: 14 capture_data = avsync_probe.Capture(12) 15 parser = avsync_probe_utils.AVSyncProbeDataParser(self.resultsdir, 16 capture_data, 30) 17 18 # Use the following attributes to access data. They can be referenced in 19 # AVSyncProbeDataParser Class. 20 parser.video_duration_average 21 parser.video_duration_std 22 parser.sync_duration_averag 23 parser.sync_duration_std 24 parser.cumulative_frame_count 25 parser.dropped_frame_count 26 parser.corrupted_frame_count 27 parser.binarize_data 28 parser.audio_events 29 parser.video_events 30 31 """ 32 33 import collections 34 import logging 35 import math 36 import os 37 import sys 38 39 40 # Indices for binarize_data, audio_events and video_events. 41 TIME_INDEX = 0 42 VIDEO_INDEX = 1 43 AUDIO_INDEX = 2 44 # This index is used for video_events and audio_events. 45 # The slot contains the time difference to the previous event. 46 TIME_DIFF_INDEX = 3 47 48 # SyncResult namedtuple of audio and video frame. 49 # time_delay < 0 means that audio comes out first. 50 SyncResult = collections.namedtuple( 51 'SynResult', ['video_time', 'audio_time', 'time_delay']) 52 53 54 class GrayCode(object): 55 """Converts bit patterns between binary and Gray code. 56 57 The bit patterns of Gray code values are packed into an int value. 58 For example, 4 is "110" in Gray code, which reads "6" when interpreted 59 as binary. 60 See "https://en.wikipedia.org/wiki/Gray_code" 61 62 """ 63 64 @staticmethod 65 def binary_to_gray(binary): 66 """Binary code to gray code. 67 68 @param binary: Binary code. 69 @return: gray code. 70 71 """ 72 return binary ^ (binary >> 1) 73 74 @staticmethod 75 def gray_to_binary(gray): 76 """Gray code to binary code. 77 78 @param gray: Gray code. 79 @return: binary code. 80 81 """ 82 result = gray 83 result ^= (result >> 16) 84 result ^= (result >> 8) 85 result ^= (result >> 4) 86 result ^= (result >> 2) 87 result ^= (result >> 1) 88 return result 89 90 91 class HysteresisSwitch(object): 92 """ 93 Iteratively binarizes input sequence using hysteresis comparator with a 94 pair of fixed thresholds. 95 96 Hysteresis means to use 2 different thresholds 97 for activating and de-activating output. It is often used for thresholding 98 time-series signal while reducing small noise in the input. 99 100 Note that the low threshold is exclusive but the high threshold is 101 inclusive. 102 When the same values were applied for the both, the object works as a 103 non-hysteresis switch. 104 (i.e. equivalent to the >= operator). 105 106 """ 107 108 def __init__(self, low_threshold, high_threshold, init_state): 109 """Init HysteresisSwitch class. 110 111 @param low_threshold: The threshold value to deactivate the output. 112 The comparison is exclusive. 113 @param high_threshold: The threshold value to activate the output. 114 The comparison is inclusive. 115 @param init_state: True or False of the switch initial state. 116 117 """ 118 if low_threshold > high_threshold: 119 raise Exception('Low threshold %d exceeds the high threshold %d', 120 low_threshold, high_threshold) 121 self._low_threshold = low_threshold 122 self._high_threshold = high_threshold 123 self._last_state = init_state 124 125 def adjust_state(self, value): 126 """Updates the state of the switch by the input value and returns the 127 result. 128 129 @param value: value for updating. 130 @return the state of the switch. 131 132 """ 133 if value < self._low_threshold: 134 self._last_state = False 135 136 if value >= self._high_threshold: 137 self._last_state = True 138 139 return self._last_state 140 141 142 class AVSyncProbeDataParser(object): 143 """ Digital information extraction from the raw sensor data sequence. 144 145 This class will transform the raw data to easier understand formats. 146 147 Attributes: 148 binarize_data: Transer the raw data to [Time, video code, is_audio]. 149 video code is from 0-7 repeatedly. 150 video_events: Events of video frame. 151 audio_events: Events of when audio happens. 152 video_duration_average: (ms) The average duration during video frames. 153 video_duration_std: Standard deviation of the video_duration_average. 154 sync_duration_average: (ms) The average duration for audio/video sync. 155 sync_duration_std: Standard deviation of sync_duration_average. 156 cumulative_frame_count: Number of total video frames. 157 dropped_frame_count: Total dropped video frames. 158 corrupted_frame_count: Total corrupted video frames. 159 160 """ 161 # Thresholds for hysteresis binarization of input signals. 162 # Relative to the minumum (0.0) and maximum (1.0) values of the value range 163 # of each input signal. 164 _NORMALIZED_LOW_THRESHOLD = 0.6 165 _NORMALIZED_HIGH_THRESHOLD = 0.7 166 167 _VIDEO_CODE_CYCLE = (1 << 3) 168 169 def __init__(self, log_dir, capture_raw_data, video_fps, 170 sound_interval_frames=None): 171 """Inits AVSyncProbeDataParser class. 172 173 @param log_dir: Directory for dumping each events' contents. 174 @param capture_raw_data: Raw data from avsync_probe device. 175 A list contains the list values of [timestamp, video0, video1, 176 video2, audio]. 177 @param video_fps: Video frames per second. Used to know if the video 178 frame is dropoped or just corrupted. 179 @param sound_interval_frames: The period of sound (beep) in the number 180 of video frames. This class will help to calculate audio/video 181 sync stats if sound_interval_frames is not None. 182 183 """ 184 self.video_duration_average = None 185 self.video_duration_std = None 186 self.sync_duration_average = None 187 self.sync_duration_std = None 188 self.cumulative_frame_count = None 189 self.dropped_frame_count = None 190 191 self._log_dir = log_dir 192 self._raw_data = capture_raw_data 193 # Translate to millisecond for each video frame. 194 self._video_duration = 1000 / video_fps 195 self._sound_interval_frames = sound_interval_frames 196 self._log_list_data_to_file('raw.txt', capture_raw_data) 197 198 self.binarize_data = self._binarize_raw_data() 199 # we need to get audio events before remove video preamble frames. 200 # Because audio event may appear before the preamble frame, if we 201 # remove the preamble frames first, we will lost the audio event. 202 self.audio_events = self._detect_audio_events() 203 self._remove_video_preamble() 204 self.video_events = self._detect_video_events() 205 self._analyze_events() 206 self._calculate_statistics_report() 207 208 def _log_list_data_to_file(self, filename, data): 209 """Log the list data to file. 210 211 It will log under self._log_dir directory. 212 213 @param filename: The file name. 214 @data: Data for logging. 215 216 """ 217 filepath = os.path.join(self._log_dir, filename) 218 with open(filepath, 'w') as f: 219 for v in data: 220 f.write('%s\n' % str(v)) 221 222 def _get_hysteresis_switch(self, index): 223 """Get HysteresisSwitch by the raw data. 224 225 @param index: The index of self._raw_data's element. 226 @return: HysteresisSwitch instance by the value of the raw data. 227 228 """ 229 max_value = max(x[index] for x in self._raw_data) 230 min_value = min(x[index] for x in self._raw_data) 231 scale = max_value - min_value 232 logging.info('index %d, max %d, min %d, scale %d', index, max_value, 233 min_value, scale) 234 return HysteresisSwitch( 235 min_value + scale * self._NORMALIZED_LOW_THRESHOLD, 236 min_value + scale * self._NORMALIZED_HIGH_THRESHOLD, 237 False) 238 239 def _binarize_raw_data(self): 240 """Conducts adaptive thresholding and decoding embedded frame codes. 241 242 Sensors[0] is timestamp. 243 Sensors[1-3] are photo transistors, which outputs lower value for 244 brighter light(=white pixels on screen). These are used to detect black 245 and white pattern on the screen, and decoded as an integer code. 246 247 The final channel is for audio input, which outputs higher voltage for 248 larger sound volume. This will be used for detecting beep sounds added 249 to the video. 250 251 @return Decoded frame codes list for all the input frames. Each entry 252 contains [Timestamp, video code, is_audio]. 253 254 """ 255 decoded_data = [] 256 257 hystersis_switch = [] 258 for i in xrange(5): 259 hystersis_switch.append(self._get_hysteresis_switch(i)) 260 261 for data in self._raw_data: 262 code = 0 263 # Decode black-and-white pattern on video. 264 # There are 3 black or white boxes sensed by the sensors. 265 # Each square represents a single bit (white = 1, black = 0) coding 266 # an integer in Gray code. 267 for i in xrange(1, 4): 268 # Lower sensor value for brighter light(square painted white). 269 is_white = not hystersis_switch[i].adjust_state(data[i]) 270 if is_white: 271 code |= (1 << (i - 1)) 272 code = GrayCode.gray_to_binary(code) 273 # The final channel is sound signal. Higher sensor value for 274 # higher sound level. 275 sound = hystersis_switch[4].adjust_state(data[4]) 276 decoded_data.append([data[0], code, sound]) 277 278 self._log_list_data_to_file('binarize_raw.txt', decoded_data) 279 return decoded_data 280 281 def _remove_video_preamble(self): 282 """Remove preamble video frames of self.binarize_data.""" 283 # find preamble frame (code = 0) 284 index = next(i for i, v in enumerate(self.binarize_data) 285 if v[VIDEO_INDEX] == 0) 286 self.binarize_data = self.binarize_data[index:] 287 288 # skip preamble frame (code = 0) 289 index = next(i for i, v in enumerate(self.binarize_data) 290 if v[VIDEO_INDEX] != 0) 291 self.binarize_data = self.binarize_data[index:] 292 293 def _detect_events(self, detect_condition): 294 """Detects events from the binarize data sequence by the 295 detect_condition. 296 297 @param detect_condition: callback function for checking event happens. 298 This API will pass index and element of binarize_data to the 299 callback function. 300 301 @return: The list of events. It's the same as the binarize_data and add 302 additional time_difference information. 303 304 """ 305 detected_events = [] 306 previous_time = self.binarize_data[0][TIME_INDEX] 307 for i, v in enumerate(self.binarize_data): 308 if (detect_condition(i, v)): 309 time = v[TIME_INDEX] 310 time_difference = time - previous_time 311 # Copy a new instance here, because we will append time 312 # difference. 313 event = list(v) 314 event.append(time_difference) 315 detected_events.append(event) 316 previous_time = time 317 318 return detected_events 319 320 def _detect_audio_events(self): 321 """Detects the audio start frame from the binarize data sequence. 322 323 @return: The list of Audio events. It's the same as the binarize_data 324 and add additional time_difference information. 325 326 """ 327 # Only check the first audio happen event. 328 detected_events = self._detect_events( 329 lambda i, v: (v[AUDIO_INDEX] and not 330 self.binarize_data[i - 1][AUDIO_INDEX])) 331 332 self._log_list_data_to_file('audio_events.txt', detected_events) 333 return detected_events 334 335 def _detect_video_events(self): 336 """Detects the video frame from the binarize data sequence. 337 338 @return: The list of Video events. It's the same as the binarize_data 339 and add additional time_difference information. 340 341 """ 342 # remove duplicate frames. (frames in transition state.) 343 detected_events = self._detect_events( 344 lambda i, v: (v[VIDEO_INDEX] != 345 self.binarize_data[i - 1][VIDEO_INDEX])) 346 347 self._log_list_data_to_file('video_events.txt', detected_events) 348 return detected_events 349 350 def _match_sync(self, video_time): 351 """Match the audio/video sync timing. 352 353 This function will find the closest sound in the audio_events to the 354 video_time and returns a audio/video sync tuple. 355 356 @param video_time: the time of the video which have sound. 357 @return A SyncResult namedtuple containing: 358 - timestamp of the video frame which should have audio. 359 - timestamp of nearest audio frame. 360 - time delay between audio and video frame. 361 362 """ 363 closest_difference = sys.maxint 364 audio_time = 0 365 for audio_event in self.audio_events: 366 difference = audio_event[TIME_INDEX] - video_time 367 if abs(difference) < abs(closest_difference): 368 closest_difference = difference 369 audio_time = audio_event[TIME_INDEX] 370 return SyncResult(video_time, audio_time, closest_difference) 371 372 def _calculate_statistics(self, data): 373 """Calculate average and standard deviation of the list data. 374 375 @param data: The list of values to be calcualted. 376 @return: An tuple with (average, standard_deviation) 377 378 """ 379 if not data: 380 return (None, None) 381 382 total = sum(data) 383 average = total / len(data) 384 variance = sum((v - average)**2 for v in data) / len(data) 385 standard_deviation = math.sqrt(variance) 386 return (average, standard_deviation) 387 388 def _analyze_events(self): 389 """Analyze audio/video events. 390 391 This function will analyze video frame status and audio/video sync 392 status. 393 394 """ 395 sound_interval_frames = self._sound_interval_frames 396 current_code = 0 397 cumulative_frame_count = 0 398 dropped_frame_count = 0 399 corrupted_frame_count = 0 400 sync_events = [] 401 402 for v in self.video_events: 403 code = v[VIDEO_INDEX] 404 time = v[TIME_INDEX] 405 frame_diff = code - current_code 406 # Get difference of the codes. # The code is between 0 - 7. 407 if frame_diff < 0: 408 frame_diff += self._VIDEO_CODE_CYCLE 409 410 if frame_diff != 1: 411 # Check if we dropped frame or just got corrupted frame. 412 # Treat the frame as corrupted frame if the frame duration is 413 # less than 2 video frame duration. 414 if v[TIME_DIFF_INDEX] < 2 * self._video_duration: 415 logging.warn('Corrupted frame near %s', str(v)) 416 # Correct the code. 417 code = current_code + 1 418 corrupted_frame_count += 1 419 frame_diff = 1 420 else: 421 logging.warn('Dropped frame near %s', str(v)) 422 dropped_frame_count += (frame_diff - 1) 423 424 cumulative_frame_count += frame_diff 425 426 if sound_interval_frames is not None: 427 # This frame corresponds to a sound. 428 if cumulative_frame_count % sound_interval_frames == 1: 429 sync_events.append(self._match_sync(time)) 430 431 current_code = code 432 self.cumulative_frame_count = cumulative_frame_count 433 self.dropped_frame_count = dropped_frame_count 434 self.corrupted_frame_count = corrupted_frame_count 435 self._sync_events = sync_events 436 self._log_list_data_to_file('sync.txt', sync_events) 437 438 def _calculate_statistics_report(self): 439 """Calculates statistics report.""" 440 video_duration_average, video_duration_std = self._calculate_statistics( 441 [v[TIME_DIFF_INDEX] for v in self.video_events]) 442 sync_duration_average, sync_duration_std = self._calculate_statistics( 443 [v.time_delay for v in self._sync_events]) 444 self.video_duration_average = video_duration_average 445 self.video_duration_std = video_duration_std 446 self.sync_duration_average = sync_duration_average 447 self.sync_duration_std = sync_duration_std 448