1 # 2 # this is a rather strict implementation of a bit vector class 3 # it is accessed the same way as an array of python-ints, except 4 # the value must be 0 or 1 5 # 6 7 import sys; rprt = sys.stderr.write #for debugging 8 9 class error(Exception): 10 pass 11 12 13 def _check_value(value): 14 if type(value) != type(0) or not 0 <= value < 2: 15 raise error, 'bitvec() items must have int value 0 or 1' 16 17 18 import math 19 20 def _compute_len(param): 21 mant, l = math.frexp(float(param)) 22 bitmask = 1L << l 23 if bitmask <= param: 24 raise RuntimeError('(param, l) = %r' % ((param, l),)) 25 while l: 26 bitmask = bitmask >> 1 27 if param & bitmask: 28 break 29 l = l - 1 30 return l 31 32 33 def _check_key(len, key): 34 if type(key) != type(0): 35 raise TypeError, 'sequence subscript not int' 36 if key < 0: 37 key = key + len 38 if not 0 <= key < len: 39 raise IndexError, 'list index out of range' 40 return key 41 42 def _check_slice(len, i, j): 43 #the type is ok, Python already checked that 44 i, j = max(i, 0), min(len, j) 45 if i > j: 46 i = j 47 return i, j 48 49 50 class BitVec: 51 52 def __init__(self, *params): 53 self._data = 0L 54 self._len = 0 55 if not len(params): 56 pass 57 elif len(params) == 1: 58 param, = params 59 if type(param) == type([]): 60 value = 0L 61 bit_mask = 1L 62 for item in param: 63 # strict check 64 #_check_value(item) 65 if item: 66 value = value | bit_mask 67 bit_mask = bit_mask << 1 68 self._data = value 69 self._len = len(param) 70 elif type(param) == type(0L): 71 if param < 0: 72 raise error, 'bitvec() can\'t handle negative longs' 73 self._data = param 74 self._len = _compute_len(param) 75 else: 76 raise error, 'bitvec() requires array or long parameter' 77 elif len(params) == 2: 78 param, length = params 79 if type(param) == type(0L): 80 if param < 0: 81 raise error, \ 82 'can\'t handle negative longs' 83 self._data = param 84 if type(length) != type(0): 85 raise error, 'bitvec()\'s 2nd parameter must be int' 86 computed_length = _compute_len(param) 87 if computed_length > length: 88 print 'warning: bitvec() value is longer than the length indicates, truncating value' 89 self._data = self._data & \ 90 ((1L << length) - 1) 91 self._len = length 92 else: 93 raise error, 'bitvec() requires array or long parameter' 94 else: 95 raise error, 'bitvec() requires 0 -- 2 parameter(s)' 96 97 98 def append(self, item): 99 #_check_value(item) 100 #self[self._len:self._len] = [item] 101 self[self._len:self._len] = \ 102 BitVec(long(not not item), 1) 103 104 105 def count(self, value): 106 #_check_value(value) 107 if value: 108 data = self._data 109 else: 110 data = (~self)._data 111 count = 0 112 while data: 113 data, count = data >> 1, count + (data & 1 != 0) 114 return count 115 116 117 def index(self, value): 118 #_check_value(value): 119 if value: 120 data = self._data 121 else: 122 data = (~self)._data 123 index = 0 124 if not data: 125 raise ValueError, 'list.index(x): x not in list' 126 while not (data & 1): 127 data, index = data >> 1, index + 1 128 return index 129 130 131 def insert(self, index, item): 132 #_check_value(item) 133 #self[index:index] = [item] 134 self[index:index] = BitVec(long(not not item), 1) 135 136 137 def remove(self, value): 138 del self[self.index(value)] 139 140 141 def reverse(self): 142 #ouch, this one is expensive! 143 #for i in self._len>>1: self[i], self[l-i] = self[l-i], self[i] 144 data, result = self._data, 0L 145 for i in range(self._len): 146 if not data: 147 result = result << (self._len - i) 148 break 149 result, data = (result << 1) | (data & 1), data >> 1 150 self._data = result 151 152 153 def sort(self): 154 c = self.count(1) 155 self._data = ((1L << c) - 1) << (self._len - c) 156 157 158 def copy(self): 159 return BitVec(self._data, self._len) 160 161 162 def seq(self): 163 result = [] 164 for i in self: 165 result.append(i) 166 return result 167 168 169 def __repr__(self): 170 ##rprt('<bitvec class instance object>.' + '__repr__()\n') 171 return 'bitvec(%r, %r)' % (self._data, self._len) 172 173 def __cmp__(self, other, *rest): 174 #rprt('%r.__cmp__%r\n' % (self, (other,) + rest)) 175 if type(other) != type(self): 176 other = apply(bitvec, (other, ) + rest) 177 #expensive solution... recursive binary, with slicing 178 length = self._len 179 if length == 0 or other._len == 0: 180 return cmp(length, other._len) 181 if length != other._len: 182 min_length = min(length, other._len) 183 return cmp(self[:min_length], other[:min_length]) or \ 184 cmp(self[min_length:], other[min_length:]) 185 #the lengths are the same now... 186 if self._data == other._data: 187 return 0 188 if length == 1: 189 return cmp(self[0], other[0]) 190 else: 191 length = length >> 1 192 return cmp(self[:length], other[:length]) or \ 193 cmp(self[length:], other[length:]) 194 195 196 def __len__(self): 197 #rprt('%r.__len__()\n' % (self,)) 198 return self._len 199 200 def __getitem__(self, key): 201 #rprt('%r.__getitem__(%r)\n' % (self, key)) 202 key = _check_key(self._len, key) 203 return self._data & (1L << key) != 0 204 205 def __setitem__(self, key, value): 206 #rprt('%r.__setitem__(%r, %r)\n' % (self, key, value)) 207 key = _check_key(self._len, key) 208 #_check_value(value) 209 if value: 210 self._data = self._data | (1L << key) 211 else: 212 self._data = self._data & ~(1L << key) 213 214 def __delitem__(self, key): 215 #rprt('%r.__delitem__(%r)\n' % (self, key)) 216 key = _check_key(self._len, key) 217 #el cheapo solution... 218 self._data = self[:key]._data | self[key+1:]._data >> key 219 self._len = self._len - 1 220 221 def __getslice__(self, i, j): 222 #rprt('%r.__getslice__(%r, %r)\n' % (self, i, j)) 223 i, j = _check_slice(self._len, i, j) 224 if i >= j: 225 return BitVec(0L, 0) 226 if i: 227 ndata = self._data >> i 228 else: 229 ndata = self._data 230 nlength = j - i 231 if j != self._len: 232 #we'll have to invent faster variants here 233 #e.g. mod_2exp 234 ndata = ndata & ((1L << nlength) - 1) 235 return BitVec(ndata, nlength) 236 237 def __setslice__(self, i, j, sequence, *rest): 238 #rprt('%s.__setslice__%r\n' % (self, (i, j, sequence) + rest)) 239 i, j = _check_slice(self._len, i, j) 240 if type(sequence) != type(self): 241 sequence = apply(bitvec, (sequence, ) + rest) 242 #sequence is now of our own type 243 ls_part = self[:i] 244 ms_part = self[j:] 245 self._data = ls_part._data | \ 246 ((sequence._data | \ 247 (ms_part._data << sequence._len)) << ls_part._len) 248 self._len = self._len - j + i + sequence._len 249 250 def __delslice__(self, i, j): 251 #rprt('%r.__delslice__(%r, %r)\n' % (self, i, j)) 252 i, j = _check_slice(self._len, i, j) 253 if i == 0 and j == self._len: 254 self._data, self._len = 0L, 0 255 elif i < j: 256 self._data = self[:i]._data | (self[j:]._data >> i) 257 self._len = self._len - j + i 258 259 def __add__(self, other): 260 #rprt('%r.__add__(%r)\n' % (self, other)) 261 retval = self.copy() 262 retval[self._len:self._len] = other 263 return retval 264 265 def __mul__(self, multiplier): 266 #rprt('%r.__mul__(%r)\n' % (self, multiplier)) 267 if type(multiplier) != type(0): 268 raise TypeError, 'sequence subscript not int' 269 if multiplier <= 0: 270 return BitVec(0L, 0) 271 elif multiplier == 1: 272 return self.copy() 273 #handle special cases all 0 or all 1... 274 if self._data == 0L: 275 return BitVec(0L, self._len * multiplier) 276 elif (~self)._data == 0L: 277 return ~BitVec(0L, self._len * multiplier) 278 #otherwise el cheapo again... 279 retval = BitVec(0L, 0) 280 while multiplier: 281 retval, multiplier = retval + self, multiplier - 1 282 return retval 283 284 def __and__(self, otherseq, *rest): 285 #rprt('%r.__and__%r\n' % (self, (otherseq,) + rest)) 286 if type(otherseq) != type(self): 287 otherseq = apply(bitvec, (otherseq, ) + rest) 288 #sequence is now of our own type 289 return BitVec(self._data & otherseq._data, \ 290 min(self._len, otherseq._len)) 291 292 293 def __xor__(self, otherseq, *rest): 294 #rprt('%r.__xor__%r\n' % (self, (otherseq,) + rest)) 295 if type(otherseq) != type(self): 296 otherseq = apply(bitvec, (otherseq, ) + rest) 297 #sequence is now of our own type 298 return BitVec(self._data ^ otherseq._data, \ 299 max(self._len, otherseq._len)) 300 301 302 def __or__(self, otherseq, *rest): 303 #rprt('%r.__or__%r\n' % (self, (otherseq,) + rest)) 304 if type(otherseq) != type(self): 305 otherseq = apply(bitvec, (otherseq, ) + rest) 306 #sequence is now of our own type 307 return BitVec(self._data | otherseq._data, \ 308 max(self._len, otherseq._len)) 309 310 311 def __invert__(self): 312 #rprt('%r.__invert__()\n' % (self,)) 313 return BitVec(~self._data & ((1L << self._len) - 1), \ 314 self._len) 315 316 def __coerce__(self, otherseq, *rest): 317 #needed for *some* of the arithmetic operations 318 #rprt('%r.__coerce__%r\n' % (self, (otherseq,) + rest)) 319 if type(otherseq) != type(self): 320 otherseq = apply(bitvec, (otherseq, ) + rest) 321 return self, otherseq 322 323 def __int__(self): 324 return int(self._data) 325 326 def __long__(self): 327 return long(self._data) 328 329 def __float__(self): 330 return float(self._data) 331 332 333 bitvec = BitVec 334