changeset 534:243202f1bda5

Commit: refactor revision creation code from clone command to work separately, fit into existing library structure
author Artem Tikhomirov <tikhomirov.artem@gmail.com>
date Mon, 04 Feb 2013 18:00:55 +0100 (2013-02-04)
parents e6f72c9829a6
children d9c07e1432c4
files src/org/tmatesoft/hg/core/HgCloneCommand.java src/org/tmatesoft/hg/internal/DataAccessProvider.java src/org/tmatesoft/hg/internal/DataSerializer.java src/org/tmatesoft/hg/internal/DeflaterDataSerializer.java src/org/tmatesoft/hg/internal/DirstateReader.java src/org/tmatesoft/hg/internal/Patch.java src/org/tmatesoft/hg/internal/RevlogCompressor.java src/org/tmatesoft/hg/internal/RevlogStream.java src/org/tmatesoft/hg/internal/RevlogStreamWriter.java src/org/tmatesoft/hg/repo/HgBundle.java src/org/tmatesoft/hg/repo/Revlog.java test/org/tmatesoft/hg/test/TestCommit.java
diffstat 12 files changed, 591 insertions(+), 74 deletions(-) [+]
line wrap: on
line diff
--- a/src/org/tmatesoft/hg/core/HgCloneCommand.java	Wed Jan 30 15:48:36 2013 +0100
+++ b/src/org/tmatesoft/hg/core/HgCloneCommand.java	Mon Feb 04 18:00:55 2013 +0100
@@ -18,6 +18,8 @@
 
 import static org.tmatesoft.hg.core.Nodeid.NULL;
 import static org.tmatesoft.hg.internal.RequiresFile.*;
+import static org.tmatesoft.hg.internal.RevlogStreamWriter.preferCompleteOverPatch;
+import static org.tmatesoft.hg.internal.RevlogStreamWriter.preferCompressedOverComplete;
 
 import java.io.File;
 import java.io.FileOutputStream;
@@ -29,6 +31,8 @@
 
 import org.tmatesoft.hg.internal.ByteArrayDataAccess;
 import org.tmatesoft.hg.internal.DataAccess;
+import org.tmatesoft.hg.internal.DataAccessProvider;
+import org.tmatesoft.hg.internal.DataSerializer;
 import org.tmatesoft.hg.internal.DigestHelper;
 import org.tmatesoft.hg.internal.Lifecycle;
 import org.tmatesoft.hg.internal.RepoInitializer;
@@ -139,6 +143,7 @@
 		private final PathRewrite storagePathHelper;
 		private final ProgressSupport progressSupport;
 		private final CancelSupport cancelSupport;
+		private final SessionContext ctx;
 		private FileOutputStream indexFile;
 		private String filename; // human-readable name of the file being written, for log/exception purposes 
 
@@ -155,13 +160,18 @@
 		private Lifecycle.Callback lifecycleCallback;
 		private CancelledException cancelException;
 
-		public WriteDownMate(SessionContext ctx, File destDir, ProgressSupport progress, CancelSupport cancel) {
+		private RevlogStreamWriter.HeaderWriter revlogHeader = new RevlogStreamWriter.HeaderWriter(true);
+		private RevlogCompressor revlogDataZip;
+
+		public WriteDownMate(SessionContext sessionCtx, File destDir, ProgressSupport progress, CancelSupport cancel) {
+			ctx = sessionCtx;
 			hgDir = new File(destDir, ".hg");
 			repoInit = new RepoInitializer();
 			repoInit.setRequires(STORE | FNCACHE | DOTENCODE);
-			storagePathHelper = repoInit.buildDataFilesHelper(ctx);
+			storagePathHelper = repoInit.buildDataFilesHelper(sessionCtx);
 			progressSupport = progress;
 			cancelSupport = cancel;
+			revlogDataZip = new RevlogCompressor(sessionCtx);
 		}
 
 		public void initEmptyRepository() throws IOException {
@@ -278,9 +288,6 @@
 			throw new HgInvalidControlFileException(m, null, new File(hgDir, filename)).setRevision(p);
 		}
 		
-		private RevlogStreamWriter.HeaderWriter revlogHeader = new RevlogStreamWriter.HeaderWriter(true);
-		private RevlogCompressor revlogDataZip = new RevlogCompressor();
-
 		public boolean element(GroupElement ge) {
 			try {
 				assert indexFile != null;
@@ -332,7 +339,7 @@
 				byte[] patchContent = ge.rawDataByteArray();
 				// no reason to keep patch if it's close (here, >75%) in size to the complete contents,
 				// save patching effort in this case
-				writeComplete = writeComplete || patchContent.length >= (/* 3/4 of actual */content.length - (content.length >>> 2));
+				writeComplete = writeComplete || preferCompleteOverPatch(patchContent.length, content.length);
 
 				if (writeComplete) {
 					revlogHeader.baseRevision(revisionSequence.size());
@@ -340,29 +347,37 @@
 				assert revlogHeader.baseRevision() >= 0;
 
 				final byte[] sourceData = writeComplete ? content : patchContent;
-				revlogDataZip.reset(sourceData);
+				revlogDataZip.reset(new DataSerializer.ByteArrayDataSource(sourceData));
 				final int compressedLen;
-				final boolean useUncompressedData = revlogDataZip.getCompressedLengthEstimate() >= (sourceData.length - (sourceData.length >>> 2));
+				final boolean useUncompressedData = preferCompressedOverComplete(revlogDataZip.getCompressedLength(), sourceData.length);
 				if (useUncompressedData) {
 					// compression wasn't too effective,
 					compressedLen = sourceData.length + 1 /*1 byte for 'u' - uncompressed prefix byte*/;
 				} else {
-					compressedLen= revlogDataZip.getCompressedLengthEstimate();
+					compressedLen= revlogDataZip.getCompressedLength();
 				}
 		
 				revlogHeader.length(content.length, compressedLen);
 				
-				revlogHeader.write(indexFile);
+				// XXX may be wise not to create DataSerializer for each revision, but for a file
+				DataAccessProvider.StreamDataSerializer sds = new DataAccessProvider.StreamDataSerializer(ctx.getLog(), indexFile) {
+					@Override
+					public void done() {
+						// override parent behavior not to close stream in use
+					}
+				};
+				revlogHeader.serialize(sds);
 
 				if (useUncompressedData) {
 					indexFile.write((byte) 'u');
 					indexFile.write(sourceData);
 				} else {
-					int actualCompressedLenWritten = revlogDataZip.writeCompressedData(indexFile);
+					int actualCompressedLenWritten = revlogDataZip.writeCompressedData(sds);
 					if (actualCompressedLenWritten != compressedLen) {
 						throw new HgInvalidStateException(String.format("Expected %d bytes of compressed data, but actually wrote %d in %s", compressedLen, actualCompressedLenWritten, filename));
 					}
 				}
+				sds.done();
 				//
 				revisionSequence.add(node);
 				prevRevContent.done();
--- a/src/org/tmatesoft/hg/internal/DataAccessProvider.java	Wed Jan 30 15:48:36 2013 +0100
+++ b/src/org/tmatesoft/hg/internal/DataAccessProvider.java	Mon Feb 04 18:00:55 2013 +0100
@@ -21,7 +21,10 @@
 
 import java.io.File;
 import java.io.FileInputStream;
+import java.io.FileNotFoundException;
+import java.io.FileOutputStream;
 import java.io.IOException;
+import java.io.OutputStream;
 import java.nio.ByteBuffer;
 import java.nio.MappedByteBuffer;
 import java.nio.channels.FileChannel;
@@ -72,7 +75,7 @@
 		return mapioBoundary == 0 ? Integer.MAX_VALUE : mapioBoundary;
 	}
 
-	public DataAccess create(File f) {
+	public DataAccess createReader(File f) {
 		if (!f.exists()) {
 			return new DataAccess();
 		}
@@ -96,6 +99,22 @@
 		}
 		return new DataAccess(); // non-null, empty.
 	}
+	
+	public DataSerializer createWriter(File f, boolean createNewIfDoesntExist) {
+		if (!f.exists() && !createNewIfDoesntExist) {
+			return new DataSerializer();
+		}
+		try {
+			return new StreamDataSerializer(context.getLog(), new FileOutputStream(f));
+		} catch (final FileNotFoundException ex) {
+			context.getLog().dump(getClass(), Error, ex, null);
+			return new DataSerializer() {
+				public void write(byte[] data, int offset, int length) throws IOException {
+					throw ex;
+				}
+			};
+		}
+	}
 
 	private static class MemoryMapFileAccess extends DataAccess {
 		private FileChannel fileChannel;
@@ -374,4 +393,57 @@
 			}
 		}
 	}
+
+	public/*XXX, private, once HgCloneCommand stops using it */ static class StreamDataSerializer extends DataSerializer {
+		private final OutputStream out;
+		private final LogFacility log;
+		private byte[] buffer;
+	
+		public StreamDataSerializer(LogFacility logFacility, OutputStream os) {
+			assert os != null;
+			out = os;
+			log = logFacility;
+		}
+		
+		@Override
+		public void write(byte[] data, int offset, int length) throws IOException {
+			out.write(data, offset, length);
+		}
+	
+		@Override
+		public void writeInt(int... values) throws IOException {
+			ensureBufferSize(4*values.length); // sizeof(int)
+			int idx = 0;
+			for (int v : values) {
+				DataSerializer.bigEndian(v, buffer, idx);
+				idx += 4;
+			}
+			out.write(buffer, 0, idx);
+		}
+		
+		@Override
+		public void writeByte(byte... values) throws IOException {
+			if (values.length == 1) {
+				out.write(values[0]);
+			} else {
+				out.write(values, 0, values.length);
+			}
+		}
+		
+		private void ensureBufferSize(int bytesNeeded) {
+			if (buffer == null || buffer.length < bytesNeeded) {
+				buffer = new byte[bytesNeeded];
+			}
+		}
+	
+		@Override
+		public void done() {
+			try {
+				out.flush();
+				out.close();
+			} catch (IOException ex) {
+				log.dump(getClass(), Error, ex, "Failure to close stream");
+			}
+		}
+	}
 }
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/src/org/tmatesoft/hg/internal/DataSerializer.java	Mon Feb 04 18:00:55 2013 +0100
@@ -0,0 +1,92 @@
+/*
+ * Copyright (c) 2013 TMate Software Ltd
+ *  
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; version 2 of the License.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * For information on how to redistribute this software under
+ * the terms of a license other than GNU General Public License
+ * contact TMate Software at support@hg4j.com
+ */
+package org.tmatesoft.hg.internal;
+
+import java.io.IOException;
+
+/**
+ * Serialization friend of {@link DataAccess}
+ * 
+ * @author Artem Tikhomirov
+ * @author TMate Software Ltd.
+ */
+@Experimental(reason="Work in progress")
+public class DataSerializer {
+	
+	public void writeByte(byte... values) throws IOException {
+		write(values, 0, values.length);
+	}
+
+	public void writeInt(int... values) throws IOException {
+		byte[] buf = new byte[4];
+		for (int v : values) {
+			bigEndian(v, buf, 0);
+			write(buf, 0, buf.length);
+		}
+	}
+
+	public void write(byte[] data, int offset, int length) throws IOException {
+		throw new IOException("Attempt to write to non-existent file");
+	}
+
+	public void done() {
+		// FIXME perhaps, shall allow IOException, too
+		// no-op
+	}
+	
+	/**
+	 * Writes 4 bytes of supplied value into the buffer at given offset, big-endian. 
+	 */
+	public static final void bigEndian(int value, byte[] buffer, int offset) {
+		assert offset + 4 <= buffer.length; 
+		buffer[offset++] = (byte) ((value >>> 24) & 0x0ff);
+		buffer[offset++] = (byte) ((value >>> 16) & 0x0ff);
+		buffer[offset++] = (byte) ((value >>> 8) & 0x0ff);
+		buffer[offset++] = (byte) (value & 0x0ff);
+	}
+	
+	@Experimental(reason="Work in progress")
+	interface DataSource {
+		public void serialize(DataSerializer out) throws IOException;
+
+		/**
+		 * Hint of data length it would like to writes
+		 * @return -1 if can't answer
+		 */
+		public int serializeLength();
+	}
+	
+	public static class ByteArrayDataSource implements DataSource {
+		
+		private final byte[] data;
+
+		public ByteArrayDataSource(byte[] bytes) {
+			data = bytes;
+		}
+
+		public void serialize(DataSerializer out) throws IOException {
+			if (data != null) {
+				out.write(data, 0, data.length);
+			}
+		}
+
+		public int serializeLength() {
+			return data == null ? 0 : data.length;
+		}
+		
+	}
+}
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/src/org/tmatesoft/hg/internal/DeflaterDataSerializer.java	Mon Feb 04 18:00:55 2013 +0100
@@ -0,0 +1,96 @@
+/*
+ * Copyright (c) 2013 TMate Software Ltd
+ *  
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; version 2 of the License.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * For information on how to redistribute this software under
+ * the terms of a license other than GNU General Public License
+ * contact TMate Software at support@hg4j.com
+ */
+package org.tmatesoft.hg.internal;
+
+import java.io.IOException;
+import java.util.zip.Deflater;
+import java.util.zip.DeflaterOutputStream;
+
+/**
+ * {@link DeflaterOutputStream} counterpart for {@link DataSerializer} API
+ * 
+ * @author Artem Tikhomirov
+ * @author TMate Software Ltd.
+ */
+class DeflaterDataSerializer extends DataSerializer {
+	
+	private static final int AUX_BUFFER_CAPACITY = 5; // room for 5 ints
+
+	private final DataSerializer delegate;
+	private final Deflater deflater;
+	private final byte[] deflateOutBuffer;
+	private final byte[] auxBuffer;
+
+	public DeflaterDataSerializer(DataSerializer delegateSerializer, Deflater def, int bufferSizeHint) {
+		delegate = delegateSerializer;
+		deflater = def;
+		deflateOutBuffer = new byte[bufferSizeHint <= 0 ? 2048 : bufferSizeHint];
+		auxBuffer = new byte[4 * AUX_BUFFER_CAPACITY]; // sizeof(int) * capacity
+	}
+
+	@Override
+	public void writeInt(int... values) throws IOException {
+		for (int i = 0; i < values.length; i+= AUX_BUFFER_CAPACITY) {
+			int idx = 0;
+			for (int j = i, x = Math.min(values.length, i + AUX_BUFFER_CAPACITY); j < x; j++) {
+				int v = values[j];
+				auxBuffer[idx++] = (byte) ((v >>> 24) & 0x0ff);
+				auxBuffer[idx++] = (byte) ((v >>> 16) & 0x0ff);
+				auxBuffer[idx++] = (byte) ((v >>> 8) & 0x0ff);
+				auxBuffer[idx++] = (byte) (v & 0x0ff);
+			}
+			internalWrite(auxBuffer, 0, idx);
+		}
+	}
+
+	@Override
+	public void write(byte[] data, int offset, int length) throws IOException {
+		// @see DeflaterOutputStream#write(byte[], int, int)
+		int stride = deflateOutBuffer.length;
+		for (int i = 0; i < length; i += stride) {
+			internalWrite(data, offset + i, Math.min(stride, length - i));
+		}
+	}
+	
+	private void internalWrite(byte[] data, int offset, int length) throws IOException {
+		deflater.setInput(data, offset, length);
+		while (!deflater.needsInput()) {
+			deflate();
+		}
+	}
+
+	@Override
+	public void done() {
+		delegate.done();
+	}
+
+	public void finish() throws IOException {
+		if (!deflater.finished()) {
+			deflater.finish();
+			while (!deflater.finished()) {
+				deflate();
+			}
+		}
+	}
+
+	protected void deflate() throws IOException {
+		int len = deflater.deflate(deflateOutBuffer, 0, deflateOutBuffer.length);
+		if (len > 0) {
+			delegate.write(deflateOutBuffer, 0, len);
+		}
+	}
+}
--- a/src/org/tmatesoft/hg/internal/DirstateReader.java	Wed Jan 30 15:48:36 2013 +0100
+++ b/src/org/tmatesoft/hg/internal/DirstateReader.java	Mon Feb 04 18:00:55 2013 +0100
@@ -66,7 +66,7 @@
 		if (dirstateFile == null || !dirstateFile.exists()) {
 			return;
 		}
-		DataAccess da = repo.getDataAccess().create(dirstateFile);
+		DataAccess da = repo.getDataAccess().createReader(dirstateFile);
 		try {
 			if (da.isEmpty()) {
 				return;
@@ -142,7 +142,7 @@
 		if (dirstateFile == null || !dirstateFile.exists()) {
 			return new Pair<Nodeid,Nodeid>(NULL, NULL);
 		}
-		DataAccess da = internalRepo.getDataAccess().create(dirstateFile);
+		DataAccess da = internalRepo.getDataAccess().createReader(dirstateFile);
 		try {
 			if (da.isEmpty()) {
 				return new Pair<Nodeid,Nodeid>(NULL, NULL);
--- a/src/org/tmatesoft/hg/internal/Patch.java	Wed Jan 30 15:48:36 2013 +0100
+++ b/src/org/tmatesoft/hg/internal/Patch.java	Mon Feb 04 18:00:55 2013 +0100
@@ -154,7 +154,29 @@
 		ends.add(e);
 		data.add(src);
 	}
-
+	
+	/**
+	 * @return how many bytes the patch would take if written down using BundleFormat structure (start, end, length, data)
+	 */
+	public int serializedLength() {
+		int totalDataLen = 0;
+		for (byte[] d : data) {
+			totalDataLen += d.length;
+		}
+		int prefix = 3 * 4 * count(); // 3 integer fields per entry * sizeof(int) * number of entries
+		return prefix + totalDataLen;
+	}
+	
+	/*package-local*/ void serialize(DataSerializer out) throws IOException {
+		for (int i = 0, x = data.size(); i < x; i++) {
+			final int start = starts.get(i);
+			final int end = ends.get(i);
+			byte[] d = data.get(i);
+			out.writeInt(start, end, d.length);
+			out.write(d, 0, d.length);
+		}
+	}
+	
 	private void add(Patch p, int i) {
 		add(p.starts.get(i), p.ends.get(i), p.data.get(i));
 	}
@@ -363,4 +385,15 @@
 		};
 		return r;
 	}
+
+	public class PatchDataSource implements DataSerializer.DataSource {
+
+		public void serialize(DataSerializer out) throws IOException {
+			Patch.this.serialize(out);
+		}
+
+		public int serializeLength() {
+			return Patch.this.serializedLength();
+		}
+	}
 }
\ No newline at end of file
--- a/src/org/tmatesoft/hg/internal/RevlogCompressor.java	Wed Jan 30 15:48:36 2013 +0100
+++ b/src/org/tmatesoft/hg/internal/RevlogCompressor.java	Mon Feb 04 18:00:55 2013 +0100
@@ -17,9 +17,10 @@
 package org.tmatesoft.hg.internal;
 
 import java.io.IOException;
-import java.io.OutputStream;
 import java.util.zip.Deflater;
-import java.util.zip.DeflaterOutputStream;
+
+import org.tmatesoft.hg.core.SessionContext;
+import org.tmatesoft.hg.util.LogFacility.Severity;
 
 /**
  * 
@@ -27,45 +28,59 @@
  * @author TMate Software Ltd.
  */
 public class RevlogCompressor {
+	private final SessionContext ctx;
 	private final Deflater zip;
-	private byte[] sourceData;
-	private int compressedLenEstimate;
+	private DataSerializer.DataSource sourceData;
+	private int compressedLen;
 	
-	public RevlogCompressor() {
+	public RevlogCompressor(SessionContext sessionCtx) {
+		ctx = sessionCtx;
 		zip = new Deflater();
 	}
 
-	public void reset(byte[] source) {
+	public void reset(DataSerializer.DataSource source) {
 		sourceData = source;
-		compressedLenEstimate = -1;
+		compressedLen = -1;
 	}
 	
-	public int writeCompressedData(OutputStream out) throws IOException {
+	// out stream is not closed!
+	public int writeCompressedData(DataSerializer out) throws IOException {
 		zip.reset();
-		DeflaterOutputStream dos = new DeflaterOutputStream(out, zip, Math.min(2048, sourceData.length));
-		dos.write(sourceData);
-		dos.finish();
+		DeflaterDataSerializer dds = new DeflaterDataSerializer(out, zip, sourceData.serializeLength());
+		sourceData.serialize(dds);
+		dds.finish();
 		return zip.getTotalOut();
 	}
 
-	public int getCompressedLengthEstimate() {
-		if (compressedLenEstimate != -1) {
-			return compressedLenEstimate;
+	public int getCompressedLength() {
+		if (compressedLen != -1) {
+			return compressedLen;
 		}
-		zip.reset();
-		int rv = 0;
-		// from DeflaterOutputStream:
-		byte[] buffer = new byte[Math.min(2048, sourceData.length)];
-        for (int i = 0, stride = buffer.length; i < sourceData.length; i+= stride) {
-            zip.setInput(sourceData, i, Math.min(stride, sourceData.length - i));
-            while (!zip.needsInput()) {
-            	rv += zip.deflate(buffer, 0, buffer.length);
-            }
-        }
-        zip.finish();
-        while (!zip.finished()) {
-        	rv += zip.deflate(buffer, 0, buffer.length);
-        }
-        return compressedLenEstimate = rv;
+		Counter counter = new Counter();
+		try {
+			compressedLen = writeCompressedData(counter);
+			assert counter.totalWritten == compressedLen;
+	        return compressedLen;
+		} catch (IOException ex) {
+			// can't happen provided we write to our stream that does nothing but byte counting
+			ctx.getLog().dump(getClass(), Severity.Error, ex, "Failed estimating compressed length of revlog data");
+			return counter.totalWritten; // use best known value so far
+		}
+	}
+
+	private static class Counter extends DataSerializer {
+		public int totalWritten = 0;
+
+		public void writeByte(byte... values) throws IOException {
+			totalWritten += values.length;
+		}
+
+		public void writeInt(int... values) throws IOException {
+			totalWritten += 4 * values.length;
+		}
+
+		public void write(byte[] data, int offset, int length) throws IOException {
+			totalWritten += length;
+		}
 	}
 }
--- a/src/org/tmatesoft/hg/internal/RevlogStream.java	Wed Jan 30 15:48:36 2013 +0100
+++ b/src/org/tmatesoft/hg/internal/RevlogStream.java	Mon Feb 04 18:00:55 2013 +0100
@@ -67,13 +67,21 @@
 	}
 
 	/*package*/ DataAccess getIndexStream() {
-		// TODO post 1.0 may supply a hint that I'll need really few bytes of data (perhaps, at some offset) 
+		// FIXME post 1.0 must supply a hint that I'll need really few bytes of data (perhaps, at some offset) 
 		// to avoid mmap files when only few bytes are to be read (i.e. #dataLength())
-		return dataAccess.create(indexFile);
+		return dataAccess.createReader(indexFile);
 	}
 
 	/*package*/ DataAccess getDataStream() {
-		return dataAccess.create(getDataFile());
+		return dataAccess.createReader(getDataFile());
+	}
+	
+	/*package*/ DataSerializer getIndexStreamWriter() {
+		return dataAccess.createWriter(indexFile, true);
+	}
+	
+	/*package*/ DataSerializer getDataStreamWriter() {
+		return dataAccess.createWriter(getDataFile(), true);
 	}
 	
 	/**
@@ -99,7 +107,21 @@
 		// although honest approach is to call #initOutline() first
 		return ex.setFile(inline ? indexFile : getDataFile());
 	}
+	
+	/*package-private*/String getDataFileName() {
+		// XXX a temporary solution to provide more info to fill in exceptions other than 
+		// HgInvalidControlFileException (those benefit from initWith* methods above)
+		//
+		// Besides, since RevlogStream represents both revlogs with user data (those with WC representative and 
+		// system data under store/data) and system-only revlogs (like changelog and manifest), there's no
+		// easy way to supply human-friendly name of the active file (independent from whether it's index of data)
+		return inline ? indexFile.getPath() : getDataFile().getPath();
+	}
 
+	public boolean isInlineData() {
+		initOutline();
+		return inline;
+	}
 	
 	public int revisionCount() {
 		initOutline();
--- a/src/org/tmatesoft/hg/internal/RevlogStreamWriter.java	Wed Jan 30 15:48:36 2013 +0100
+++ b/src/org/tmatesoft/hg/internal/RevlogStreamWriter.java	Mon Feb 04 18:00:55 2013 +0100
@@ -17,16 +17,19 @@
 package org.tmatesoft.hg.internal;
 
 import static org.tmatesoft.hg.internal.Internals.REVLOGV1_RECORD_SIZE;
+import static org.tmatesoft.hg.repo.HgRepository.NO_REVISION;
 
 import java.io.IOException;
-import java.io.OutputStream;
 import java.nio.ByteBuffer;
 
 import org.tmatesoft.hg.core.Nodeid;
+import org.tmatesoft.hg.core.SessionContext;
+import org.tmatesoft.hg.repo.HgInvalidControlFileException;
+import org.tmatesoft.hg.repo.HgInvalidStateException;
 
 /**
  * 
- * TODO check if index is too big and split into index+data
+ * TODO separate operation to check if index is too big and split into index+data
  * 
  * @author Artem Tikhomirov
  * @author TMate Software Ltd.
@@ -34,13 +37,14 @@
 public class RevlogStreamWriter {
 
 	
-	public static class HeaderWriter {
+	/*XXX public because HgCloneCommand uses it*/
+	public static class HeaderWriter implements DataSerializer.DataSource {
 		private final ByteBuffer header;
 		private final boolean isInline;
 		private long offset;
 		private int length, compressedLength;
 		private int baseRev, linkRev, p1, p2;
-		private Nodeid nodeid;
+		private byte[] nodeid;
 		
 		public HeaderWriter(boolean inline) {
 			isInline = inline;
@@ -74,16 +78,21 @@
 		}
 		
 		public HeaderWriter linkRevision(int linkRevision) {
-			this.linkRev = linkRevision;
+			linkRev = linkRevision;
 			return this;
 		}
 		
 		public HeaderWriter nodeid(Nodeid n) {
-			this.nodeid = n;
+			nodeid = n.toByteArray();
 			return this;
 		}
-
-		public void write(OutputStream out) throws IOException {
+		
+		public HeaderWriter nodeid(byte[] nodeidBytes) {
+			nodeid = nodeidBytes;
+			return this;
+		}
+		
+		public void serialize(DataSerializer out) throws IOException {
 			header.clear();
 			if (offset == 0) {
 				int version = 1 /* RevlogNG */;
@@ -102,34 +111,161 @@
 			header.putInt(linkRev);
 			header.putInt(p1);
 			header.putInt(p2);
-			header.put(nodeid.toByteArray());
+			header.put(nodeid);
 			// assume 12 bytes left are zeros
-			out.write(header.array());
+			out.write(header.array(), 0, header.capacity());
 
 			// regardless whether it's inline or separate data,
 			// offset field always represent cumulative compressedLength 
 			// (while offset in the index file with inline==true differs by n*sizeof(header), where n is entry's position in the file) 
 			offset += compressedLength;
 		}
+		
+		public int serializeLength() {
+			return header.capacity();
+		}
+	}
+
+	private final DigestHelper dh = new DigestHelper();
+	private final RevlogCompressor revlogDataZip;
+	
+	
+	public RevlogStreamWriter(SessionContext ctx, RevlogStream stream) {
+		revlogDataZip = new RevlogCompressor(ctx);
 	}
 	
-	
-	private final DigestHelper dh = new DigestHelper();
+	private int lastEntryBase, lastEntryIndex;
+	private byte[] lastEntryContent;
+	private Nodeid lastEntryRevision;
+	private IntMap<Nodeid> revisionCache = new IntMap<Nodeid>(32);
 	
 	public void addRevision(byte[] content, int linkRevision, int p1, int p2) {
-		Nodeid p1Rev = parent(p1);
-		Nodeid p2Rev = parent(p2);
-		byte[] revisionBytes = dh.sha1(p1Rev, p2Rev, content).asBinary();
-		//final Nodeid revision = Nodeid.fromBinary(revisionBytes, 0);
-		// cache last revision (its delta and baseRev)
+		int revCount = revlogStream.revisionCount();
+		lastEntryIndex = revCount == 0 ? NO_REVISION : revCount - 1;
+		populateLastEntry();
+		//
 		PatchGenerator pg = new PatchGenerator();
-		byte[] prev = null;
-		Patch patch = pg.delta(prev, content);
-		byte[] patchContent;
-		// rest as in HgCloneCommand
+		Patch patch = pg.delta(lastEntryContent, content);
+		int patchSerializedLength = patch.serializedLength();
+		
+		final boolean writeComplete = preferCompleteOverPatch(patchSerializedLength, content.length);
+		DataSerializer.DataSource dataSource = writeComplete ? new DataSerializer.ByteArrayDataSource(content) : patch.new PatchDataSource();
+		revlogDataZip.reset(dataSource);
+		final int compressedLen;
+		final boolean useUncompressedData = preferCompressedOverComplete(revlogDataZip.getCompressedLength(), dataSource.serializeLength());
+		if (useUncompressedData) {
+			// compression wasn't too effective,
+			compressedLen = dataSource.serializeLength() + 1 /*1 byte for 'u' - uncompressed prefix byte*/;
+		} else {
+			compressedLen= revlogDataZip.getCompressedLength();
+		}
+		//
+		Nodeid p1Rev = revision(p1);
+		Nodeid p2Rev = revision(p2);
+		byte[] revisionNodeidBytes = dh.sha1(p1Rev, p2Rev, content).asBinary();
+		//
+
+		DataSerializer indexFile, dataFile, activeFile;
+		indexFile = dataFile = activeFile = null;
+		try {
+			//
+			activeFile = indexFile = revlogStream.getIndexStreamWriter();
+			final boolean isInlineData = revlogStream.isInlineData();
+			HeaderWriter revlogHeader = new HeaderWriter(isInlineData);
+			revlogHeader.length(content.length, compressedLen);
+			revlogHeader.nodeid(revisionNodeidBytes);
+			revlogHeader.linkRevision(linkRevision);
+			revlogHeader.parents(p1, p2);
+			revlogHeader.baseRevision(writeComplete ? lastEntryIndex+1 : lastEntryBase);
+			//
+			revlogHeader.serialize(indexFile);
+			
+			if (isInlineData) {
+				dataFile = indexFile;
+			} else {
+				dataFile = revlogStream.getDataStreamWriter();
+			}
+			activeFile = dataFile;
+			if (useUncompressedData) {
+				dataFile.writeByte((byte) 'u');
+				dataSource.serialize(dataFile);
+			} else {
+				int actualCompressedLenWritten = revlogDataZip.writeCompressedData(dataFile);
+				if (actualCompressedLenWritten != compressedLen) {
+					throw new HgInvalidStateException(String.format("Expected %d bytes of compressed data, but actually wrote %d in %s", compressedLen, actualCompressedLenWritten, revlogStream.getDataFileName()));
+				}
+			}
+			
+			lastEntryContent = content;
+			lastEntryBase = revlogHeader.baseRevision();
+			lastEntryIndex++;
+			lastEntryRevision = Nodeid.fromBinary(revisionNodeidBytes, 0);
+			revisionCache.put(lastEntryIndex, lastEntryRevision);
+		} catch (IOException ex) {
+			String m = String.format("Failed to write revision %d", lastEntryIndex+1, null);
+			HgInvalidControlFileException t = new HgInvalidControlFileException(m, ex, null);
+			if (activeFile == dataFile) {
+				throw revlogStream.initWithDataFile(t);
+			} else {
+				throw revlogStream.initWithIndexFile(t);
+			}
+		} finally {
+			indexFile.done();
+			if (dataFile != null && dataFile != indexFile) {
+				dataFile.done();
+			}
+		}
 	}
 	
-	private Nodeid parent(int parentIndex) {
-		return null;
+	private RevlogStream revlogStream;
+	private Nodeid revision(int revisionIndex) {
+		if (revisionIndex == NO_REVISION) {
+			return Nodeid.NULL;
+		}
+		Nodeid n = revisionCache.get(revisionIndex);
+		if (n == null) {
+			n = Nodeid.fromBinary(revlogStream.nodeid(revisionIndex), 0);
+			revisionCache.put(revisionIndex, n);
+		}
+		return n;
+	}
+	
+	private void populateLastEntry() throws HgInvalidControlFileException {
+		if (lastEntryIndex != NO_REVISION && lastEntryContent == null) {
+			assert lastEntryIndex >= 0;
+			final IOException[] failure = new IOException[1];
+			revlogStream.iterate(lastEntryIndex, lastEntryIndex, true, new RevlogStream.Inspector() {
+				
+				public void next(int revisionIndex, int actualLen, int baseRevision, int linkRevision, int parent1Revision, int parent2Revision, byte[] nodeid, DataAccess data) {
+					try {
+						lastEntryBase = baseRevision;
+						lastEntryRevision = Nodeid.fromBinary(nodeid, 0);
+						lastEntryContent = data.byteArray();
+					} catch (IOException ex) {
+						failure[0] = ex;
+					}
+				}
+			});
+			if (failure[0] != null) {
+				String m = String.format("Failed to get content of most recent revision %d", lastEntryIndex);
+				throw revlogStream.initWithDataFile(new HgInvalidControlFileException(m, failure[0], null));
+			}
+		}
+	}
+	
+	public static boolean preferCompleteOverPatch(int patchLength, int fullContentLength) {
+		return !decideWorthEffort(patchLength, fullContentLength);
+	}
+	
+	public static boolean preferCompressedOverComplete(int compressedLen, int fullContentLength) {
+		if (compressedLen <= 0) { // just in case, meaningless otherwise
+			return false;
+		}
+		return decideWorthEffort(compressedLen, fullContentLength);
+	}
+
+	// true if length obtained with effort is worth it 
+	private static boolean decideWorthEffort(int lengthWithExtraEffort, int lengthWithoutEffort) {
+		return lengthWithExtraEffort < (/* 3/4 of original */lengthWithoutEffort - (lengthWithoutEffort >>> 2));
 	}
 }
--- a/src/org/tmatesoft/hg/repo/HgBundle.java	Wed Jan 30 15:48:36 2013 +0100
+++ b/src/org/tmatesoft/hg/repo/HgBundle.java	Mon Feb 04 18:00:55 2013 +0100
@@ -60,7 +60,7 @@
 	}
 
 	private DataAccess getDataStream() throws IOException {
-		DataAccess da = accessProvider.create(bundleFile);
+		DataAccess da = accessProvider.createReader(bundleFile);
 		byte[] signature = new byte[6];
 		if (da.length() > 6) {
 			da.readBytes(signature, 0, 6);
--- a/src/org/tmatesoft/hg/repo/Revlog.java	Wed Jan 30 15:48:36 2013 +0100
+++ b/src/org/tmatesoft/hg/repo/Revlog.java	Mon Feb 04 18:00:55 2013 +0100
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2010-2012 TMate Software Ltd
+ * Copyright (c) 2010-2013 TMate Software Ltd
  *  
  * This program is free software; you can redistribute it and/or modify
  * it under the terms of the GNU General Public License as published by
@@ -84,11 +84,14 @@
 	}
 	
 	/**
-	 * @return index of last known revision, a.k.a. {@link HgRepository#TIP}
+	 * @return index of last known revision, a.k.a. {@link HgRepository#TIP}, or {@link HgRepository#NO_REVISION} if revlog is empty
 	 * @throws HgRuntimeException subclass thereof to indicate issues with the library. <em>Runtime exception</em>
 	 */
 	public final int getLastRevision() throws HgRuntimeException {
-		return content.revisionCount() - 1;
+		// although old code gives correct result when revlog is empty (NO_REVISION deliberately == -1), 
+		// it's still better to be explicit
+		int revCount = content.revisionCount();
+		return revCount == 0 ? NO_REVISION : revCount - 1;
 	}
 
 	/**
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test/org/tmatesoft/hg/test/TestCommit.java	Mon Feb 04 18:00:55 2013 +0100
@@ -0,0 +1,33 @@
+/*
+ * Copyright (c) 2013 TMate Software Ltd
+ *  
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; version 2 of the License.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * For information on how to redistribute this software under
+ * the terms of a license other than GNU General Public License
+ * contact TMate Software at support@hg4j.com
+ */
+package org.tmatesoft.hg.test;
+
+import org.junit.Assert;
+import org.junit.Test;
+
+/**
+ * 
+ * @author Artem Tikhomirov
+ * @author TMate Software Ltd.
+ */
+public class TestCommit {
+
+	@Test
+	public void testCommitToEmpty() throws Exception {
+		Assert.fail();
+	}
+}