comparison mercurial/util.py @ 11758:a79214972da2 stable

chunkbuffer: use += rather than cStringIO to reduce memory footprint This significantly refactors the read() loop to use a queue of chunks. The queue is alternately filled to at least 256k and then emptied by concatenating onto the output buffer. For very large read sizes, += uses less memory because it can resize the target string in place.
author Matt Mackall <mpm@selenic.com>
date Fri, 06 Aug 2010 12:18:33 -0500
parents c37f35d7f2f5
children 05deba16c5d5 ff5cec76b1c5
comparison
equal deleted inserted replaced
11757:65bd4b8e48bd 11758:a79214972da2
13 hide platform-specific details from the core. 13 hide platform-specific details from the core.
14 """ 14 """
15 15
16 from i18n import _ 16 from i18n import _
17 import error, osutil, encoding 17 import error, osutil, encoding
18 import cStringIO, errno, re, shutil, sys, tempfile, traceback 18 import errno, re, shutil, sys, tempfile, traceback
19 import os, stat, time, calendar, textwrap, unicodedata, signal 19 import os, stat, time, calendar, textwrap, unicodedata, signal
20 import imp 20 import imp
21 21
22 # Python compatibility 22 # Python compatibility
23 23
907 907
def __init__(self, in_iter):
    """in_iter is the iterator that's iterating over the input chunks."""
    # Normalize to an iterator so read() can pull from it lazily,
    # whether the caller passed an iterator or any other iterable.
    self.iter = iter(in_iter)
    # Chunks already fetched from self.iter but not yet consumed by
    # read(); read() refills this in ~256k batches and drains it.
    self._queue = []
def read(self, l):
    """Read L bytes of data from the iterator of chunks of data.
    Returns less than L bytes if the iterator runs dry."""
    pending = self._queue
    out = ''
    remaining = l
    while remaining > 0:
        # Refill the queue when it runs dry: buffer roughly 256k of
        # chunks at a time before draining them into the output.
        if not pending:
            want = 2 ** 18
            for piece in self.iter:
                pending.append(piece)
                want -= len(piece)
                if want <= 0:
                    break
            if not pending:
                # Iterator exhausted; return whatever we collected.
                break

        piece = pending.pop(0)
        remaining -= len(piece)
        if remaining < 0:
            # Chunk overshoots the request: push the unread tail back
            # onto the queue and take only the part we need.
            pending.insert(0, piece[remaining:])
            out += piece[:remaining]
        else:
            # += resizes the target string in place for large reads,
            # keeping the memory footprint low.
            out += piece

    return out
937 942
938 def filechunkiter(f, size=65536, limit=None): 943 def filechunkiter(f, size=65536, limit=None):
939 """Create a generator that produces the data in the file size 944 """Create a generator that produces the data in the file size
940 (default 65536) bytes at a time, up to optional limit (default is 945 (default 65536) bytes at a time, up to optional limit (default is
941 to read all data). Chunks may be less than size bytes if the 946 to read all data). Chunks may be less than size bytes if the