mygpo/utils.py

   1 #
   2 # This file is part of my.gpodder.org.
   3 #
   4 # my.gpodder.org is free software: you can redistribute it and/or modify it
   5 # under the terms of the GNU Affero General Public License as published by
   6 # the Free Software Foundation, either version 3 of the License, or (at your
   7 # option) any later version.
   8 #
   9 # my.gpodder.org is distributed in the hope that it will be useful, but
  10 # WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
  11 # or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
  12 # License for more details.
  13 #
  14 # You should have received a copy of the GNU Affero General Public License
  15 # along with my.gpodder.org. If not, see <http://www.gnu.org/licenses/>.
  16 #
  17
  18 import functools
  19 import types
  20 import subprocess
  21 import os
  22 import operator
  23 import sys
  24 import re
  25 import collections
  26 from datetime import datetime, timedelta, date
  27 import time
  28 import hashlib
  29 import urlparse
  30 import urllib
  31 import urllib2
  32 import zlib
  33
  34 from django.conf import settings
  35
  36 from mygpo.core.json import json
  37
  38
  39 def daterange(from_date, to_date=None, leap=timedelta(days=1)):
  40     """
  41     >>> from_d = datetime(2010, 01, 01)
  42     >>> to_d = datetime(2010, 01, 05)
  43     >>> list(daterange(from_d, to_d))
  44     [datetime.datetime(2010, 1, 1, 0, 0), datetime.datetime(2010, 1, 2, 0, 0), datetime.datetime(2010, 1, 3, 0, 0), datetime.datetime(2010, 1, 4, 0, 0), datetime.datetime(2010, 1, 5, 0, 0)]
  45     """
  46
  47     if to_date is None:
  48         if isinstance(from_date, datetime):
  49             to_date = datetime.now()
  50         else:
  51             to_date = date.today()
  52
  53     while from_date <= to_date:
  54         yield from_date
  55         from_date = from_date + leap
  56     return
  57
  58 def format_time(value):
  59     """Format an offset (in seconds) to a string
  60
  61     The offset should be an integer or float value.
  62
  63     >>> format_time(0)
  64     '00:00'
  65     >>> format_time(20)
  66     '00:20'
  67     >>> format_time(3600)
  68     '01:00:00'
  69     >>> format_time(10921)
  70     '03:02:01'
  71     """
  72     try:
  73         dt = datetime.utcfromtimestamp(value)
  74     except ValueError:
  75         return ''
  76
  77     if dt.hour == 0:
  78         return dt.strftime('%M:%S')
  79     else:
  80         return dt.strftime('%H:%M:%S')
  81
  82 def parse_time(value):
  83     """
  84     >>> parse_time(10)
  85     10
  86
  87     >>> parse_time('05:10') #5*60+10
  88     310
  89
  90     >>> parse_time('1:05:10') #60*60+5*60+10
  91     3910
  92     """
  93     if value is None:
  94         raise ValueError('None value in parse_time')
  95
  96     if isinstance(value, int):
  97         # Don't need to parse already-converted time value
  98         return value
  99
 100     if value == '':
 101         raise ValueError('Empty valueing in parse_time')
 102
 103     for format in ('%H:%M:%S', '%M:%S'):
 104         try:
 105             t = time.strptime(value, format)
 106             return t.tm_hour * 60*60 + t.tm_min * 60 + t.tm_sec
 107         except ValueError, e:
 108             continue
 109
 110     return int(value)
 111
 112
 113 def parse_bool(val):
 114     """
 115     >>> parse_bool('True')
 116     True
 117
 118     >>> parse_bool('true')
 119     True
 120
 121     >>> parse_bool('')
 122     False
 123     """
 124     if isinstance(val, bool):
 125         return val
 126     if val.lower() == 'true':
 127         return True
 128     return False
 129
 130
 131 def iterate_together(lists, key=lambda x: x, reverse=False):
 132     """
 133     takes ordered, possibly sparse, lists with similar items
 134     (some items have a corresponding item in the other lists, some don't).
 135
 136     It then yield tuples of corresponding items, where one element is None is
 137     there is no corresponding entry in one of the lists.
 138
 139     Tuples where both elements are None are skipped.
 140
 141     The results of the key method are used for the comparisons.
 142
 143     If reverse is True, the lists are expected to be sorted in reverse order
 144     and the results will also be sorted reverse
 145
 146     >>> list(iterate_together([range(1, 3), range(1, 4, 2)]))
 147     [(1, 1), (2, None), (None, 3)]
 148
 149     >>> list(iterate_together([[], []]))
 150     []
 151
 152     >>> list(iterate_together([range(1, 3), range(3, 5)]))
 153     [(1, None), (2, None), (None, 3), (None, 4)]
 154
 155     >>> list(iterate_together([range(1, 3), []]))
 156     [(1, None), (2, None)]
 157
 158     >>> list(iterate_together([[1, None, 3], [None, None, 3]]))
 159     [(1, None), (3, 3)]
 160     """
 161
 162     Next = collections.namedtuple('Next', 'item more')
 163     min_ = min if not reverse else max
 164     lt_  = operator.lt if not reverse else operator.gt
 165
 166     lists = [iter(l) for l in lists]
 167
 168     def _take(it):
 169         try:
 170             i = it.next()
 171             while i is None:
 172                 i = it.next()
 173             return Next(i, True)
 174         except StopIteration:
 175             return Next(None, False)
 176
 177     def new_res():
 178         return [None]*len(lists)
 179
 180     # take first bunch of items
 181     items = [_take(l) for l in lists]
 182
 183     while any(i.item is not None or i.more for i in items):
 184
 185         res = new_res()
 186
 187         for n, item in enumerate(items):
 188
 189             if item.item is None:
 190                 continue
 191
 192             if all(x is None for x in res):
 193                 res[n] = item.item
 194                 continue
 195
 196             min_v = min_(filter(lambda x: x is not None, res), key=key)
 197
 198             if key(item.item) == key(min_v):
 199                 res[n] = item.item
 200
 201             elif lt_(key(item.item), key(min_v)):
 202                 res = new_res()
 203                 res[n] = item.item
 204
 205         for n, x in enumerate(res):
 206             if x is not None:
 207                 items[n] = _take(lists[n])
 208
 209         yield tuple(res)
 210
 211
 212 def progress(val, max_val, status_str='', max_width=50, stream=sys.stdout):
 213
 214     factor = float(val)/max_val if max_val > 0 else 0
 215
 216     # progress as percentage
 217     percentage_str = '{val:.2%}'.format(val=factor)
 218
 219     # progress bar filled with #s
 220     factor = min(int(factor*max_width), max_width)
 221     progress_str = '#' * factor + ' ' * (max_width-factor)
 222
 223     #insert percentage into bar
 224     percentage_start = int((max_width-len(percentage_str))/2)
 225     progress_str = progress_str[:percentage_start] + \
 226                    percentage_str + \
 227                    progress_str[percentage_start+len(percentage_str):]
 228
 229     print >> stream, '\r',
 230     print >> stream, '[ %s ] %s / %s | %s' % (
 231         progress_str,
 232         val,
 233         max_val,
 234         status_str),
 235     stream.flush()
 236
 237
 238 def set_cmp(list, simplify):
 239     """
 240     Builds a set out of a list but uses the results of simplify to determine equality between items
 241     """
 242     simpl = lambda x: (simplify(x), x)
 243     lst = dict(map(simpl, list))
 244     return lst.values()
 245
 246
 247 def first(it):
 248     """
 249     returns the first not-None object or None if the iterator is exhausted
 250     """
 251     for x in it:
 252         if x is not None:
 253             return x
 254     return None
 255
 256
 257 def intersect(a, b):
 258     return list(set(a) & set(b))
 259
 260
 261
 262 def remove_control_chars(s):
 263     all_chars = (unichr(i) for i in xrange(0x110000))
 264     control_chars = ''.join(map(unichr, range(0,32) + range(127,160)))
 265     control_char_re = re.compile('[%s]' % re.escape(control_chars))
 266
 267     return control_char_re.sub('', s)
 268
 269
 270 def unzip(a):
 271     return tuple(map(list,zip(*a)))
 272
 273
 274 def parse_range(s, min, max, default=None):
 275     """
 276     Parses the string and returns its value. If the value is outside the given
 277     range, its closest number within the range is returned
 278
 279     >>> parse_range('5', 0, 10)
 280     5
 281
 282     >>> parse_range('0', 5, 10)
 283     5
 284
 285     >>> parse_range('15',0, 10)
 286     10
 287
 288     >>> parse_range('x', 0, 20)
 289     10
 290
 291     >>> parse_range('x', 0, 20, 20)
 292     20
 293     """
 294     try:
 295         val = int(s)
 296         if val < min:
 297             return min
 298         if val > max:
 299             return max
 300         return val
 301
 302     except (ValueError, TypeError):
 303         return default if default is not None else (max-min)/2
 304
 305
 306
 307 def flatten(l):
 308     return [item for sublist in l for item in sublist]
 309
 310
 311 def linearize(key, iterators, reverse=False):
 312     """
 313     Linearizes a number of iterators, sorted by some comparison function
 314     """
 315
 316     iters = [iter(i) for i in iterators]
 317     vals = []
 318     for i in iters:
 319         try:
 320             v = i.next()
 321             vals. append( (v, i) )
 322         except StopIteration:
 323             continue
 324
 325     while vals:
 326         vals = sorted(vals, key=lambda x: key(x[0]), reverse=reverse)
 327         val, it = vals.pop(0)
 328         yield val
 329         try:
 330             next_val = it.next()
 331             vals.append( (next_val, it) )
 332         except StopIteration:
 333             pass
 334
 335
 336 def skip_pairs(iterator, cmp=cmp):
 337     """ Skips pairs of equal items
 338
 339     >>> list(skip_pairs([]))
 340     []
 341
 342     >>> list(skip_pairs([1]))
 343     [1]
 344
 345     >>> list(skip_pairs([1, 2, 3]))
 346     [1, 2, 3]
 347
 348     >>> list(skip_pairs([1, 1]))
 349     []
 350
 351     >>> list(skip_pairs([1, 2, 2]))
 352     [1]
 353
 354     >>> list(skip_pairs([1, 2, 2, 3]))
 355     [1, 3]
 356
 357     >>> list(skip_pairs([1, 2, 2, 2]))
 358     [1, 2]
 359
 360     >>> list(skip_pairs([1, 2, 2, 2, 2, 3]))
 361     [1, 3]
 362     """
 363
 364     iterator = iter(iterator)
 365     next = iterator.next()
 366
 367     while True:
 368         item = next
 369         try:
 370             next = iterator.next()
 371         except StopIteration as e:
 372             yield item
 373             raise e
 374
 375         if cmp(item, next) == 0:
 376             next = iterator.next()
 377         else:
 378             yield item
 379
 380
 381 def get_timestamp(datetime_obj):
 382     """ Returns the timestamp as an int for the given datetime object
 383
 384     >>> get_timestamp(datetime(2011, 4, 7, 9, 30, 6))
 385     1302168606
 386
 387     >>> get_timestamp(datetime(1970, 1, 1, 0, 0, 0))
 388     0
 389     """
 390     return int(time.mktime(datetime_obj.timetuple()))
 391
 392
 393
 394 re_url = re.compile('^https?://')
 395
 396 def is_url(string):
 397     """ Returns true if a string looks like an URL
 398
 399     >>> is_url('http://example.com/some-path/file.xml')
 400     True
 401
 402     >>> is_url('something else')
 403     False
 404     """
 405
 406     return bool(re_url.match(string))
 407
 408
 409
 410 # from http://stackoverflow.com/questions/2892931/longest-common-substring-from-more-than-two-strings-python
 411 # this does not increase asymptotical complexity
 412 # but can still waste more time than it saves.
 413 def shortest_of(strings):
 414     return min(strings, key=len)
 415
 416 def longest_substr(strings):
 417     """
 418     Returns the longest common substring of the given strings
 419     """
 420
 421     substr = ""
 422     if not strings:
 423         return substr
 424     reference = shortest_of(strings)
 425     length = len(reference)
 426     #find a suitable slice i:j
 427     for i in xrange(length):
 428         #only consider strings long at least len(substr) + 1
 429         for j in xrange(i + len(substr) + 1, length):
 430             candidate = reference[i:j]
 431             if all(candidate in text for text in strings):
 432                 substr = candidate
 433     return substr
 434
 435
 436
 437 def additional_value(it, gen_val, val_changed=lambda _: True):
 438     """ Provides an additional value to the elements, calculated when needed
 439
 440     For the elements from the iterator, some additional value can be computed
 441     by gen_val (which might be an expensive computation).
 442
 443     If the elements in the iterator are ordered so that some subsequent
 444     elements would generate the same additional value, val_changed can be
 445     provided, which receives the next element from the iterator and the
 446     previous additional value. If the element would generate the same
 447     additional value (val_changed returns False), its computation is skipped.
 448
 449     >>> # get the next full hundred higher than x
 450     >>> # this will probably be an expensive calculation
 451     >>> next_hundred = lambda x: x + 100-(x % 100)
 452
 453     >>> # returns True if h is not the value that next_hundred(x) would provide
 454     >>> # this should be a relatively cheap calculation, compared to the above
 455     >>> diff_hundred = lambda x, h: (h-x) < 0 or (h - x) > 100
 456
 457     >>> xs = [0, 50, 100, 101, 199, 200, 201]
 458     >>> list(additional_value(xs, next_hundred, diff_hundred))
 459     [(0, 100), (50, 100), (100, 100), (101, 200), (199, 200), (200, 200), (201, 300)]
 460     """
 461
 462     _none = object()
 463     current = _none
 464
 465     for x in it:
 466         if current is _none or val_changed(x, current):
 467             current = gen_val(x)
 468
 469         yield (x, current)
 470
 471
 472 def file_hash(f, h=hashlib.md5, block_size=2**20):
 473     """ returns the hash of the contents of a file """
 474     f_hash = h()
 475     for chunk in iter(lambda: f.read(block_size), ''):
 476         f_hash.update(chunk)
 477     return f_hash
 478
 479
 480
 481 def split_list(l, prop):
 482     """ split elements that satisfy a property, and those that don't """
 483     match   = filter(prop, l)
 484     nomatch = [x for x in l if x not in match]
 485     return match, nomatch
 486
 487
 488 def sorted_chain(links, key, reverse=False):
 489     """ Takes a list of iters can iterates over sorted elements
 490
 491     Each elment of links should be a tuple of (sort_key, iterator). The
 492     elements of each iterator should be sorted already. sort_key should
 493     indicate the key of the first element and needs to be comparable to the
 494     result of key(elem).
 495
 496     The function returns an iterator over the globally sorted element that
 497     ensures that as little iterators as possible are evaluated.  When
 498     evaluating """
 499
 500     # mixed_list initially contains all placeholders; later evaluated
 501     # elements (from the iterators) are mixed in
 502     mixed_list = [(k, link, True) for k, link in links]
 503
 504     while mixed_list:
 505         _, item, expand = mixed_list.pop(0)
 506
 507         # found an element (from an earlier expansion), yield it
 508         if not expand:
 509             yield item
 510             continue
 511
 512         # found an iter that needs to be expanded.
 513         # The iterator is fully consumed
 514         new_items = [(key(i), i, False) for i in item]
 515
 516         # sort links (placeholders) and elements together
 517         mixed_list = sorted(mixed_list + new_items, key=lambda (k, _v, _e): k,
 518                 reverse=reverse)
 519
 520
 521 def url_add_authentication(url, username, password):
 522     """
 523     Adds authentication data (username, password) to a given
 524     URL in order to construct an authenticated URL.
 525
 526     >>> url_add_authentication('https://host.com/', '', None)
 527     'https://host.com/'
 528     >>> url_add_authentication('http://example.org/', None, None)
 529     'http://example.org/'
 530     >>> url_add_authentication('telnet://host.com/', 'foo', 'bar')
 531     'telnet://foo:bar@host.com/'
 532     >>> url_add_authentication('ftp://example.org', 'billy', None)
 533     'ftp://billy@example.org'
 534     >>> url_add_authentication('ftp://example.org', 'billy', '')
 535     'ftp://billy:@example.org'
 536     >>> url_add_authentication('http://localhost/x', 'aa', 'bc')
 537     'http://aa:bc@localhost/x'
 538     >>> url_add_authentication('http://blubb.lan/u.html', 'i/o', 'P@ss:')
 539     'http://i%2Fo:P@ss:@blubb.lan/u.html'
 540     >>> url_add_authentication('http://a:b@x.org/', 'c', 'd')
 541     'http://c:d@x.org/'
 542     >>> url_add_authentication('http://i%2F:P%40%3A@cx.lan', 'P@x', 'i/')
 543     'http://P@x:i%2F@cx.lan'
 544     >>> url_add_authentication('http://x.org/', 'a b', 'c d')
 545     'http://a%20b:c%20d@x.org/'
 546     """
 547     if username is None or username == '':
 548         return url
 549
 550     # Relaxations of the strict quoting rules (bug 1521):
 551     # 1. Accept '@' in username and password
 552     # 2. Acecpt ':' in password only
 553     username = urllib.quote(username, safe='@')
 554
 555     if password is not None:
 556         password = urllib.quote(password, safe='@:')
 557         auth_string = ':'.join((username, password))
 558     else:
 559         auth_string = username
 560
 561     url = url_strip_authentication(url)
 562
 563     url_parts = list(urlparse.urlsplit(url))
 564     # url_parts[1] is the HOST part of the URL
 565     url_parts[1] = '@'.join((auth_string, url_parts[1]))
 566
 567     return urlparse.urlunsplit(url_parts)
 568
 569
 570 def urlopen(url, headers=None, data=None):
 571     """
 572     An URL opener with the User-agent set to gPodder (with version)
 573     """
 574     username, password = username_password_from_url(url)
 575     if username is not None or password is not None:
 576         url = url_strip_authentication(url)
 577         password_mgr = urllib2.HTTPPasswordMgrWithDefaultRealm()
 578         password_mgr.add_password(None, url, username, password)
 579         handler = urllib2.HTTPBasicAuthHandler(password_mgr)
 580         opener = urllib2.build_opener(handler)
 581     else:
 582         opener = urllib2.build_opener()
 583
 584     if headers is None:
 585         headers = {}
 586     else:
 587         headers = dict(headers)
 588
 589     headers.update({'User-agent': settings.USER_AGENT})
 590     request = urllib2.Request(url, data=data, headers=headers)
 591     return opener.open(request)
 592
 593
 594
 595 def username_password_from_url(url):
 596     r"""
 597     Returns a tuple (username,password) containing authentication
 598     data from the specified URL or (None,None) if no authentication
 599     data can be found in the URL.
 600
 601     See Section 3.1 of RFC 1738 (http://www.ietf.org/rfc/rfc1738.txt)
 602
 603     >>> username_password_from_url('https://@host.com/')
 604     ('', None)
 605     >>> username_password_from_url('telnet://host.com/')
 606     (None, None)
 607     >>> username_password_from_url('ftp://foo:@host.com/')
 608     ('foo', '')
 609     >>> username_password_from_url('http://a:b@host.com/')
 610     ('a', 'b')
 611     >>> username_password_from_url(1)
 612     Traceback (most recent call last):
 613       ...
 614     ValueError: URL has to be a string or unicode object.
 615     >>> username_password_from_url(None)
 616     Traceback (most recent call last):
 617       ...
 618     ValueError: URL has to be a string or unicode object.
 619     >>> username_password_from_url('http://a@b:c@host.com/')
 620     ('a@b', 'c')
 621     >>> username_password_from_url('ftp://a:b:c@host.com/')
 622     ('a', 'b:c')
 623     >>> username_password_from_url('http://i%2Fo:P%40ss%3A@host.com/')
 624     ('i/o', 'P@ss:')
 625     >>> username_password_from_url('ftp://%C3%B6sterreich@host.com/')
 626     ('\xc3\xb6sterreich', None)
 627     >>> username_password_from_url('http://w%20x:y%20z@example.org/')
 628     ('w x', 'y z')
 629     >>> username_password_from_url('http://example.com/x@y:z@test.com/')
 630     (None, None)
 631     """
 632     if type(url) not in (str, unicode):
 633         raise ValueError('URL has to be a string or unicode object.')
 634
 635     (username, password) = (None, None)
 636
 637     (scheme, netloc, path, params, query, fragment) = urlparse.urlparse(url)
 638
 639     if '@' in netloc:
 640         (authentication, netloc) = netloc.rsplit('@', 1)
 641         if ':' in authentication:
 642             (username, password) = authentication.split(':', 1)
 643
 644             # RFC1738 dictates that we should not allow ['/', '@', ':']
 645             # characters in the username and password field (Section 3.1):
 646             #
 647             # 1. The "/" can't be in there at this point because of the way
 648             #    urlparse (which we use above) works.
 649             # 2. Due to gPodder bug 1521, we allow "@" in the username and
 650             #    password field. We use netloc.rsplit('@', 1), which will
 651             #    make sure that we split it at the last '@' in netloc.
 652             # 3. The colon must be excluded (RFC2617, Section 2) in the
 653             #    username, but is apparently allowed in the password. This
 654             #    is handled by the authentication.split(':', 1) above, and
 655             #    will cause any extraneous ':'s to be part of the password.
 656
 657             username = urllib.unquote(username)
 658             password = urllib.unquote(password)
 659         else:
 660             username = urllib.unquote(authentication)
 661
 662     return (username, password)
 663
 664
 665 def url_strip_authentication(url):
 666     """
 667     Strips authentication data from an URL. Returns the URL with
 668     the authentication data removed from it.
 669
 670     >>> url_strip_authentication('https://host.com/')
 671     'https://host.com/'
 672     >>> url_strip_authentication('telnet://foo:bar@host.com/')
 673     'telnet://host.com/'
 674     >>> url_strip_authentication('ftp://billy@example.org')
 675     'ftp://example.org'
 676     >>> url_strip_authentication('ftp://billy:@example.org')
 677     'ftp://example.org'
 678     >>> url_strip_authentication('http://aa:bc@localhost/x')
 679     'http://localhost/x'
 680     >>> url_strip_authentication('http://i%2Fo:P%40ss%3A@blubb.lan/u.html')
 681     'http://blubb.lan/u.html'
 682     >>> url_strip_authentication('http://c:d@x.org/')
 683     'http://x.org/'
 684     >>> url_strip_authentication('http://P%40%3A:i%2F@cx.lan')
 685     'http://cx.lan'
 686     >>> url_strip_authentication('http://x@x.com:s3cret@example.com/')
 687     'http://example.com/'
 688     """
 689     url_parts = list(urlparse.urlsplit(url))
 690     # url_parts[1] is the HOST part of the URL
 691
 692     # Remove existing authentication data
 693     if '@' in url_parts[1]:
 694         url_parts[1] = url_parts[1].rsplit('@', 1)[1]
 695
 696     return urlparse.urlunsplit(url_parts)
 697
 698
 699 # Native filesystem encoding detection
 700 encoding = sys.getfilesystemencoding()
 701
 702 def sanitize_encoding(filename):
 703     r"""
 704     Generate a sanitized version of a string (i.e.
 705     remove invalid characters and encode in the
 706     detected native language encoding).
 707
 708     >>> sanitize_encoding('\x80')
 709     ''
 710     >>> sanitize_encoding(u'unicode')
 711     'unicode'
 712     """
 713     # The encoding problem goes away in Python 3.. hopefully!
 714     if sys.version_info >= (3, 0):
 715         return filename
 716
 717     global encoding
 718     if not isinstance(filename, unicode):
 719         filename = filename.decode(encoding, 'ignore')
 720     return filename.encode(encoding, 'ignore')
 721
 722
 723 def get_git_head():
 724     """ returns the commit and message of the current git HEAD """
 725
 726     try:
 727         pr = subprocess.Popen('/usr/bin/git log -n 1 --oneline'.split(),
 728             cwd = settings.BASE_DIR,
 729             stdout = subprocess.PIPE,
 730             stderr = subprocess.PIPE,
 731         )
 732
 733     except OSError:
 734         return None, None
 735
 736     (out, err) = pr.communicate()
 737     if err:
 738         return None, None
 739
 740     outs = out.split()
 741     commit = outs[0]
 742     msg = ' ' .join(outs[1:])
 743     return commit, msg
 744
 745
 746
# See https://gist.github.com/samuraisam/901117

# Default tolerance for datetime comparisons in deep_eq: no tolerance at all
default_fudge = timedelta(seconds=0, microseconds=0, days=0)

def deep_eq(_v1, _v2, datetime_fudge=default_fudge, _assert=False):
  """
  Tests for deep equality between two python data structures recursing
  into sub-structures if necessary. Works with all python types including
  iterators and generators. This function was dreamt up to test API responses
  but could be used for anything. Be careful. With deeply nested structures
  you may blow the stack.

  How the values are compared is decided by the type of the first value:
  strings are compared directly, dictionaries key by key, and everything
  else that is iterable element by element. Iterables are converted to
  lists for this, so iterators and generators that are passed in are
  consumed. All other values are compared with ==.

  Options:
            datetime_fudge => this is a datetime.timedelta object which, when
                              comparing dates, will accept values that differ
                              by the number of seconds specified (only the
                              seconds attribute of the timedelta is used)
            _assert        => passing yes for this will raise an assertion error
                              when values do not match, instead of returning
                              false (very useful in combination with pdb)

  Doctests included:

  >>> x1, y1 = ({'a': 'b'}, {'a': 'b'})
  >>> deep_eq(x1, y1)
  True
  >>> x2, y2 = ({'a': 'b'}, {'b': 'a'})
  >>> deep_eq(x2, y2)
  False
  >>> x3, y3 = ({'a': {'b': 'c'}}, {'a': {'b': 'c'}})
  >>> deep_eq(x3, y3)
  True
  >>> x4, y4 = ({'c': 't', 'a': {'b': 'c'}}, {'a': {'b': 'n'}, 'c': 't'})
  >>> deep_eq(x4, y4)
  False
  >>> x5, y5 = ({'a': [1,2,3]}, {'a': [1,2,3]})
  >>> deep_eq(x5, y5)
  True
  >>> x6, y6 = ({'a': [1,'b',8]}, {'a': [2,'b',8]})
  >>> deep_eq(x6, y6)
  False
  >>> x7, y7 = ('a', 'a')
  >>> deep_eq(x7, y7)
  True
  >>> x8, y8 = (['p','n',['asdf']], ['p','n',['asdf']])
  >>> deep_eq(x8, y8)
  True
  >>> x9, y9 = (['p','n',['asdf',['omg']]], ['p', 'n', ['asdf',['nowai']]])
  >>> deep_eq(x9, y9)
  False
  >>> x10, y10 = (1, 2)
  >>> deep_eq(x10, y10)
  False
  >>> deep_eq((str(p) for p in xrange(10)), (str(p) for p in xrange(10)))
  True
  >>> str(deep_eq(range(4), range(4)))
  'True'
  >>> deep_eq(xrange(100), xrange(100))
  True
  >>> deep_eq(xrange(2), xrange(5))
  False
  >>> from datetime import datetime, timedelta
  >>> d1, d2 = (datetime.now(), datetime.now() + timedelta(seconds=4))
  >>> deep_eq(d1, d2)
  False
  >>> deep_eq(d1, d2, datetime_fudge=timedelta(seconds=5))
  True
  """
  # recursive calls use the same options as this call
  _deep_eq = functools.partial(deep_eq, datetime_fudge=datetime_fudge,
                               _assert=_assert)

  def _check_assert(R, a, b, reason=''):
    # passes the comparison result R through; in _assert mode a negative
    # result raises an AssertionError that describes the mismatch instead
    if _assert and not R:
      assert 0, "an assertion has failed in deep_eq (%s) %s != %s" % (
        reason, str(a), str(b))
    return R

  def _deep_dict_eq(d1, d2):
    # dictionaries are equal if they have the same keys and the values of
    # all keys are deeply equal
    k1, k2 = (sorted(d1.keys()), sorted(d2.keys()))
    if k1 != k2: # keys should be exactly equal
      return _check_assert(False, k1, k2, "keys")

    # counts the equal values (True counts as 1); all values are compared,
    # there is no early exit on the first mismatch
    return _check_assert(operator.eq(sum(_deep_eq(d1[k], d2[k])
                                       for k in k1),
                                     len(k1)), d1, d2, "dictionaries")

  def _deep_iter_eq(l1, l2):
    # lists are equal if they have the same length and the elements at all
    # positions are deeply equal
    if len(l1) != len(l2):
      return _check_assert(False, l1, l2, "lengths")
    return _check_assert(operator.eq(sum(_deep_eq(v1, v2)
                                      for v1, v2 in zip(l1, l2)),
                                     len(l1)), l1, l2, "iterables")

  def op(a, b):
    # default comparison for strings and values that are not iterable
    _op = operator.eq
    if type(a) == datetime and type(b) == datetime:
      # NOTE(review): only the seconds attribute of the timedelta is used;
      # its days and microseconds are not taken into account
      s = datetime_fudge.seconds
      # the time tuples carry no microseconds, so the dates are compared
      # with a resolution of seconds
      t1, t2 = (time.mktime(a.timetuple()), time.mktime(b.timetuple()))
      l = t1 - t2
      # l becomes the negated absolute difference, the check below is
      # therefore equivalent to abs(t1 - t2) <= s
      l = -l if l > 0 else l
      return _check_assert((-s if s > 0 else s) <= l, a, b, "dates")
    return _check_assert(_op(a, b), a, b, "values")

  c1, c2 = (_v1, _v2)

  # guard against strings because they are iterable and their
  # elements yield iterables infinitely.
  # I N C E P T I O N
  for t in types.StringTypes:
    if isinstance(_v1, t):
      break
  else:
    # not a string: select the comparison based on the type of _v1
    # NOTE(review): the type of _v2 is not checked here -- confirm that
    # callers only compare values of matching types
    if isinstance(_v1, types.DictType):
      op = _deep_dict_eq
    else:
      try:
        # materialize both values, this consumes iterators and generators
        c1, c2 = (list(iter(_v1)), list(iter(_v2)))
      except TypeError:
        # not iterable, compare the plain values
        c1, c2 = _v1, _v2
      else:
        op = _deep_iter_eq

  return op(c1, c2)
 869
 870
 871 def parse_request_body(request):
 872     """ returns the parsed request body, handles gzip encoding """
 873
 874     raw_body = request.body
 875     content_enc = request.META.get('HTTP_CONTENT_ENCODING')
 876
 877     if content_enc == 'gzip':
 878         raw_body = zlib.decompress(raw_body)
 879
 880     return json.loads(raw_body)