# HG changeset patch # User Artem Tikhomirov # Date 1303142664 -7200 # Node ID e2115da4cf6aca1580799bed56b60502db42b43c # Parent c9b305df0b890b6657285abb5ddbdeb902e5037a Pool objects to avoid memory polution with duplicates diff -r c9b305df0b89 -r e2115da4cf6a src/org/tmatesoft/hg/core/HgChangeset.java --- a/src/org/tmatesoft/hg/core/HgChangeset.java Fri Apr 15 05:17:44 2011 +0200 +++ b/src/org/tmatesoft/hg/core/HgChangeset.java Mon Apr 18 18:04:24 2011 +0200 @@ -64,7 +64,7 @@ /*package-local*/ void init(int localRevNumber, Nodeid nid, RawChangeset rawChangeset) { revNumber = localRevNumber; nodeid = nid; - changeset = rawChangeset; + changeset = rawChangeset.clone(); modifiedFiles = addedFiles = null; deletedFiles = null; parent1 = parent2 = null; @@ -169,7 +169,7 @@ public HgChangeset clone() { try { HgChangeset copy = (HgChangeset) super.clone(); - copy.changeset = changeset.clone(); + // copy.changeset references this.changeset, doesn't need own copy return copy; } catch (CloneNotSupportedException ex) { throw new InternalError(ex.toString()); diff -r c9b305df0b89 -r e2115da4cf6a src/org/tmatesoft/hg/internal/Pool.java --- a/src/org/tmatesoft/hg/internal/Pool.java Fri Apr 15 05:17:44 2011 +0200 +++ b/src/org/tmatesoft/hg/internal/Pool.java Mon Apr 18 18:04:24 2011 +0200 @@ -36,4 +36,18 @@ } return rv; } + + @Override + public String toString() { + StringBuilder sb = new StringBuilder(); + sb.append(Pool.class.getSimpleName()); + sb.append('<'); + if (!unify.isEmpty()) { + sb.append(unify.keySet().iterator().next().getClass().getName()); + } + sb.append('>'); + sb.append(':'); + sb.append(unify.size()); + return sb.toString(); + } } \ No newline at end of file diff -r c9b305df0b89 -r e2115da4cf6a src/org/tmatesoft/hg/repo/HgChangelog.java --- a/src/org/tmatesoft/hg/repo/HgChangelog.java Fri Apr 15 05:17:44 2011 +0200 +++ b/src/org/tmatesoft/hg/repo/HgChangelog.java Mon Apr 18 18:04:24 2011 +0200 @@ -30,8 +30,10 @@ import java.util.Map; import java.util.TimeZone; +import org.tmatesoft.hg.core.HgBadStateException; import org.tmatesoft.hg.core.Nodeid; import org.tmatesoft.hg.internal.DataAccess; +import org.tmatesoft.hg.internal.Pool; import org.tmatesoft.hg.internal.RevlogStream; /** @@ -51,28 +53,16 @@ } public void range(int start, int end, final HgChangelog.Inspector inspector) { - RevlogStream.Inspector i = new RevlogStream.Inspector() { - - public void next(int revisionNumber, int actualLen, int baseRevision, int linkRevision, int parent1Revision, int parent2Revision, byte[] nodeid, DataAccess da) { - RawChangeset cset = RawChangeset.parse(da); - // XXX there's no guarantee for Changeset.Callback that distinct instance comes each time, consider instance reuse - inspector.next(revisionNumber, Nodeid.fromBinary(nodeid, 0), cset); - } - }; - content.iterate(start, end, true, i); + if (inspector == null) { + throw new IllegalArgumentException(); + } + content.iterate(start, end, true, new RawCsetParser(inspector)); } public List range(int start, int end) { - final ArrayList rv = new ArrayList(end - start + 1); - RevlogStream.Inspector i = new RevlogStream.Inspector() { - - public void next(int revisionNumber, int actualLen, int baseRevision, int linkRevision, int parent1Revision, int parent2Revision, byte[] nodeid, DataAccess da) { - RawChangeset cset = RawChangeset.parse(da); - rv.add(cset); - } - }; - content.iterate(start, end, true, i); - return rv; + final RawCsetCollector c = new RawCsetCollector(end - start + 1); + range(start, end, c); + return c.result; } public void range(final HgChangelog.Inspector inspector, final int... revisions) { @@ -80,11 +70,11 @@ return; } RevlogStream.Inspector i = new RevlogStream.Inspector() { + private final RawCsetParser delegate = new RawCsetParser(inspector); public void next(int revisionNumber, int actualLen, int baseRevision, int linkRevision, int parent1Revision, int parent2Revision, byte[] nodeid, DataAccess da) { if (Arrays.binarySearch(revisions, revisionNumber) >= 0) { - RawChangeset cset = RawChangeset.parse(da); - inspector.next(revisionNumber, Nodeid.fromBinary(nodeid, 0), cset); + delegate.next(revisionNumber, actualLen, baseRevision, linkRevision, parent1Revision, parent2Revision, nodeid, da); } } }; @@ -206,14 +196,15 @@ try { byte[] data = da.byteArray(); RawChangeset rv = new RawChangeset(); - rv.init(data, 0, data.length); + rv.init(data, 0, data.length, null); return rv; } catch (IOException ex) { - throw new IllegalArgumentException(ex); // FIXME better handling of IOExc + throw new HgBadStateException(ex); // FIXME "Error reading changeset data" } } - /* package-local */void init(byte[] data, int offset, int length) { + // @param usersPool - it's likely user names get repeated again and again throughout repository. can be null + /* package-local */void init(byte[] data, int offset, int length, Pool usersPool) { final int bufferEndIndex = offset + length; final byte lineBreak = (byte) '\n'; int breakIndex1 = indexOf(data, lineBreak, offset, bufferEndIndex); @@ -226,6 +217,9 @@ throw new IllegalArgumentException("Bad Changeset data"); } String _user = new String(data, breakIndex1 + 1, breakIndex2 - breakIndex1 - 1); + if (usersPool != null) { + _user = usersPool.unify(_user); + } int breakIndex3 = indexOf(data, lineBreak, breakIndex2 + 1, bufferEndIndex); if (breakIndex3 == -1) { throw new IllegalArgumentException("Bad Changeset data"); @@ -312,4 +306,39 @@ } } + private static class RawCsetCollector implements Inspector { + final ArrayList result; + + public RawCsetCollector(int count) { + result = new ArrayList(count > 0 ? count : 5); + } + + public void next(int revisionNumber, Nodeid nodeid, RawChangeset cset) { + result.add(cset.clone()); + } + } + + private static class RawCsetParser implements RevlogStream.Inspector { + + private final Inspector inspector; + private final Pool usersPool; + private final RawChangeset cset = new RawChangeset(); + + public RawCsetParser(HgChangelog.Inspector delegate) { + assert delegate != null; + inspector = delegate; + usersPool = new Pool(); + } + + public void next(int revisionNumber, int actualLen, int baseRevision, int linkRevision, int parent1Revision, int parent2Revision, byte[] nodeid, DataAccess da) { + try { + byte[] data = da.byteArray(); + cset.init(data, 0, data.length, usersPool); + // XXX there's no guarantee for Changeset.Callback that distinct instance comes each time, consider instance reuse + inspector.next(revisionNumber, Nodeid.fromBinary(nodeid, 0), cset); + } catch (Exception ex) { + throw new HgBadStateException(ex); // FIXME exception handling + } + } + } } diff -r c9b305df0b89 -r e2115da4cf6a src/org/tmatesoft/hg/repo/HgManifest.java --- a/src/org/tmatesoft/hg/repo/HgManifest.java Fri Apr 15 05:17:44 2011 +0200 +++ b/src/org/tmatesoft/hg/repo/HgManifest.java Mon Apr 18 18:04:24 2011 +0200 @@ -21,6 +21,7 @@ import org.tmatesoft.hg.core.HgBadStateException; import org.tmatesoft.hg.core.Nodeid; import org.tmatesoft.hg.internal.DataAccess; +import org.tmatesoft.hg.internal.Pool; import org.tmatesoft.hg.internal.RevlogStream; @@ -36,50 +37,10 @@ } public void walk(int start, int end, final Inspector inspector) { - RevlogStream.Inspector insp = new RevlogStream.Inspector() { - - private boolean gtg = true; // good to go - - public void next(int revisionNumber, int actualLen, int baseRevision, int linkRevision, int parent1Revision, int parent2Revision, byte[] nodeid, DataAccess da) { - if (!gtg) { - return; - } - try { - gtg = gtg && inspector.begin(revisionNumber, new Nodeid(nodeid, true)); - int i; - String fname = null; - String flags = null; - Nodeid nid = null; - byte[] data = da.byteArray(); - for (i = 0; gtg && i < actualLen; i++) { - int x = i; - for( ; data[i] != '\n' && i < actualLen; i++) { - if (fname == null && data[i] == 0) { - fname = new String(data, x, i - x); - x = i+1; - } - } - if (i < actualLen) { - assert data[i] == '\n'; - int nodeidLen = i - x < 40 ? i-x : 40; - nid = Nodeid.fromAscii(data, x, nodeidLen); - if (nodeidLen + x < i) { - // 'x' and 'l' for executable bits and symlinks? - // hg --debug manifest shows 644 for each regular file in my repo - flags = new String(data, x + nodeidLen, i-x-nodeidLen); - } - gtg = gtg && inspector.next(nid, fname, flags); - } - nid = null; - fname = flags = null; - } - gtg = gtg && inspector.end(revisionNumber); - } catch (IOException ex) { - throw new HgBadStateException(ex); - } - } - }; - content.iterate(start, end, true, insp); + if (inspector == null) { + throw new IllegalArgumentException(); + } + content.iterate(start, end, true, new ManifestParser(inspector)); } public interface Inspector { @@ -87,4 +48,59 @@ boolean next(Nodeid nid, String fname, String flags); boolean end(int revision); } + + private static class ManifestParser implements RevlogStream.Inspector { + private boolean gtg = true; // good to go + private final Inspector inspector; + private final Pool nodeidPool; + private final Pool fnamePool; + private final Pool flagsPool; + + public ManifestParser(Inspector delegate) { + assert delegate != null; + inspector = delegate; + nodeidPool = new Pool(); + fnamePool = new Pool(); + flagsPool = new Pool(); + } + + public void next(int revisionNumber, int actualLen, int baseRevision, int linkRevision, int parent1Revision, int parent2Revision, byte[] nodeid, DataAccess da) { + if (!gtg) { + return; + } + try { + gtg = gtg && inspector.begin(revisionNumber, new Nodeid(nodeid, true)); + int i; + String fname = null; + String flags = null; + Nodeid nid = null; + byte[] data = da.byteArray(); + for (i = 0; gtg && i < actualLen; i++) { + int x = i; + for( ; data[i] != '\n' && i < actualLen; i++) { + if (fname == null && data[i] == 0) { + fname = fnamePool.unify(new String(data, x, i - x)); + x = i+1; + } + } + if (i < actualLen) { + assert data[i] == '\n'; + int nodeidLen = i - x < 40 ? i-x : 40; + nid = nodeidPool.unify(Nodeid.fromAscii(data, x, nodeidLen)); + if (nodeidLen + x < i) { + // 'x' and 'l' for executable bits and symlinks? + // hg --debug manifest shows 644 for each regular file in my repo + flags = flagsPool.unify(new String(data, x + nodeidLen, i-x-nodeidLen)); + } + gtg = gtg && inspector.next(nid, fname, flags); + } + nid = null; + fname = flags = null; + } + gtg = gtg && inspector.end(revisionNumber); + } catch (IOException ex) { + throw new HgBadStateException(ex); + } + } + } }