hg/gitweb: mercurial/revlog.py comparison

comparison mercurial/revlog.py @ 2255:3f38e872f39a

Reduce RAM used for very large inlined index files. During a clone, an inline index is not converted to a split index file until the very end. When the conversion happens, the index can be very large, and the inline index loading functions always load the entire index file into RAM. This changes the revlog code to read the index in smaller chunks.

author	mason@suse.com
date	Wed, 10 May 2006 15:26:56 -0700
parents	45aef5ddcdbe
children	854954fd410a

comparison

equal deleted inserted replaced

-:827fcfe88b14
+:3f38e872f39a
 # big index, let's parse it on demand
 parser = lazyparser(f, st.st_size, self.indexformat, shaoffset)
 self.index = lazyindex(parser)
 self.nodemap = lazymap(parser)
 else:
-i = f.read()
+self.parseindex(f, st)
-self.parseindex(i)
-if self.inlinedata():
-# we've already got the entire data file read in, save it
-# in the chunk data
-self.chunkcache = (0, i)
 if self.version != REVLOGV0:
 e = list(self.index[0])
 type = self.ngtype(e[0])
 e[0] = self.offset_type(0, type)
 self.index[0] = e
 else:
 self.nodemap = { nullid: -1}
 self.index = []
-def parseindex(self, data):
+def parseindex(self, fp, st):
 s = struct.calcsize(self.indexformat)
-l = len(data)
 self.index = []
 self.nodemap =  {nullid: -1}
 inline = self.inlinedata()
-off = 0
 n = 0
-while off < l:
+leftover = None
-e = struct.unpack(self.indexformat, data[off:off + s])
+while True:
-self.index.append(e)
+if st:
-self.nodemap[e[-1]] = n
+data = fp.read(65536)
-n += 1
+else:
-off += s
+# hack for httprangereader, it doesn't do partial reads well
-if inline:
+data = fp.read()
-off += e[1]
+if not data:
+break
+if n == 0 and self.inlinedata():
+# cache the first chunk
+self.chunkcache = (0, data)
+off = 0
+l = len(data)
+while off < l:
+if l - off < s:
+leftover = data[off:]
+break
+if leftover:
+cur = leftover + data[off:off + s - len(leftover)]
+off += s - len(leftover)
+leftover = None
+else:
+cur = data[off:off + s]
+off += s
+e = struct.unpack(self.indexformat, cur)
+self.index.append(e)
+self.nodemap[e[-1]] = n
+n += 1
+if inline:
+off += e[1]
+if off > l:
+# some things don't seek well, just read it
+fp.read(off - l)
+if not st:
+break
 def ngoffset(self, q):
 if q & 0xFFFF:
 raise RevlogError(_('%s: incompatible revision flag %x') %
 (self.indexfile, q))

Mercurial > hg > gitweb

comparison mercurial/revlog.py @ 2255:3f38e872f39a