# HG changeset patch # User Gregory Szorc # Date 1444091792 25200 # Node ID 6ae14d1ca3aa7929338f57c4f308aaca88b4d108 # Parent 46143f31290e489181a1a88a1ef42ccfad17a489 util.chunkbuffer: avoid extra mutations when reading partial chunks Previously, a read(N) where N was less than the length of the first available chunk would mutate the deque instance twice and allocate a new str from the slice of the existing chunk. Profiling drawed my attention to these as a potential hot spot during changegroup reading. This patch makes the code more complicated in order to avoid the aforementioned 3 operations. On a pre-generated mozilla-central gzip bundle, this series has the following impact on `hg unbundle` performance on my MacBook Pro: before: 358.21 real 317.69 user 38.49 sys after: 301.57 real 262.69 user 37.11 sys delta: -56.64 real -55.00 user -1.38 sys diff -r 46143f31290e -r 6ae14d1ca3aa mercurial/util.py --- a/mercurial/util.py Mon Oct 05 16:34:47 2015 -0700 +++ b/mercurial/util.py Mon Oct 05 17:36:32 2015 -0700 @@ -1286,6 +1286,7 @@ yield chunk self.iter = splitbig(in_iter) self._queue = collections.deque() + self._chunkoffset = 0 def read(self, l=None): """Read L bytes of data from the iterator of chunks of data. @@ -1310,20 +1311,40 @@ if not queue: break + # The easy way to do this would be to queue.popleft(), modify the + # chunk (if necessary), then queue.appendleft(). However, for cases + # where we read partial chunk content, this incurs 2 dequeue + # mutations and creates a new str for the remaining chunk in the + # queue. Our code below avoids this overhead. + chunk = queue[0] chunkl = len(chunk) + offset = self._chunkoffset # Use full chunk. - if left >= chunkl: + if offset == 0 and left >= chunkl: left -= chunkl queue.popleft() buf.append(chunk) + # self._chunkoffset remains at 0. + continue + + chunkremaining = chunkl - offset + + # Use all of unconsumed part of chunk. + if left >= chunkremaining: + left -= chunkremaining + queue.popleft() + # offset == 0 is enabled by block above, so this won't merely + # copy via ``chunk[0:]``. + buf.append(chunk[offset:]) + self._chunkoffset = 0 + # Partial chunk needed. else: - left -= chunkl - queue.popleft() - queue.appendleft(chunk[left:]) - buf.append(chunk[:left]) + buf.append(chunk[offset:offset + left]) + self._chunkoffset += left + left -= chunkremaining return ''.join(buf)