View Javadoc
1   /*
2    * Copyright (C) 2008-2009, Google Inc.
3    * Copyright (C) 2008, Shawn O. Pearce <spearce@spearce.org>
4    * and other copyright owners as documented in the project's IP log.
5    *
6    * This program and the accompanying materials are made available
7    * under the terms of the Eclipse Distribution License v1.0 which
8    * accompanies this distribution, is reproduced below, and is
9    * available at http://www.eclipse.org/org/documents/edl-v10.php
10   *
11   * All rights reserved.
12   *
13   * Redistribution and use in source and binary forms, with or
14   * without modification, are permitted provided that the following
15   * conditions are met:
16   *
17   * - Redistributions of source code must retain the above copyright
18   *   notice, this list of conditions and the following disclaimer.
19   *
20   * - Redistributions in binary form must reproduce the above
21   *   copyright notice, this list of conditions and the following
22   *   disclaimer in the documentation and/or other materials provided
23   *   with the distribution.
24   *
25   * - Neither the name of the Eclipse Foundation, Inc. nor the
26   *   names of its contributors may be used to endorse or promote
27   *   products derived from this software without specific prior
28   *   written permission.
29   *
30   * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
31   * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
32   * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
33   * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
34   * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
35   * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
36   * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
37   * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
38   * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
39   * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
40   * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
41   * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
42   * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
43   */
44  
45  package org.eclipse.jgit.util;
46  
47  import java.io.BufferedOutputStream;
48  import java.io.File;
49  import java.io.FileInputStream;
50  import java.io.FileOutputStream;
51  import java.io.IOException;
52  import java.io.InputStream;
53  import java.io.OutputStream;
54  import java.util.ArrayList;
55  
56  import org.eclipse.jgit.internal.JGitText;
57  import org.eclipse.jgit.lib.NullProgressMonitor;
58  import org.eclipse.jgit.lib.ProgressMonitor;
59  import org.eclipse.jgit.util.io.SafeBufferedOutputStream;
60  
61  /**
62   * A fully buffered output stream.
63   * <p>
64   * Subclasses determine the behavior when the in-memory buffer capacity has been
65   * exceeded and additional bytes are still being received for output.
66   */
67  public abstract class TemporaryBuffer extends OutputStream {
68  	/** Default limit for in-core storage. */
69  	protected static final int DEFAULT_IN_CORE_LIMIT = 1024 * 1024;
70  
71  	/** Chain of data, if we are still completely in-core; otherwise null. */
72  	private ArrayList<Block> blocks;
73  
74  	/**
75  	 * Maximum number of bytes we will permit storing in memory.
76  	 * <p>
77  	 * When this limit is reached the data will be shifted to a file on disk,
78  	 * preventing the JVM heap from growing out of control.
79  	 */
80  	private int inCoreLimit;
81  
82  	/** Initial size of block list. */
83  	private int initialBlocks;
84  
85  	/** If {@link #inCoreLimit} has been reached, remainder goes here. */
86  	private OutputStream overflow;
87  
88  	/**
89  	 * Create a new empty temporary buffer.
90  	 *
91  	 * @param limit
92  	 *            maximum number of bytes to store in memory before entering the
93  	 *            overflow output path; also used as the estimated size.
94  	 */
95  	protected TemporaryBuffer(final int limit) {
96  		this(limit, limit);
97  	}
98  
99  	/**
100 	 * Create a new empty temporary buffer.
101 	 *
102 	 * @param estimatedSize
103 	 *            estimated size of storage used, to size the initial list of
104 	 *            block pointers.
105 	 * @param limit
106 	 *            maximum number of bytes to store in memory before entering the
107 	 *            overflow output path.
108 	 * @since 4.0
109 	 */
110 	protected TemporaryBuffer(final int estimatedSize, final int limit) {
111 		if (estimatedSize > limit)
112 			throw new IllegalArgumentException();
113 		this.inCoreLimit = limit;
114 		this.initialBlocks = (estimatedSize - 1) / Block.SZ + 1;
115 		reset();
116 	}
117 
118 	@Override
119 	public void write(final int b) throws IOException {
120 		if (overflow != null) {
121 			overflow.write(b);
122 			return;
123 		}
124 
125 		Block s = last();
126 		if (s.isFull()) {
127 			if (reachedInCoreLimit()) {
128 				overflow.write(b);
129 				return;
130 			}
131 
132 			s = new Block();
133 			blocks.add(s);
134 		}
135 		s.buffer[s.count++] = (byte) b;
136 	}
137 
138 	@Override
139 	public void write(final byte[] b, int off, int len) throws IOException {
140 		if (overflow == null) {
141 			while (len > 0) {
142 				Block s = last();
143 				if (s.isFull()) {
144 					if (reachedInCoreLimit())
145 						break;
146 
147 					s = new Block();
148 					blocks.add(s);
149 				}
150 
151 				final int n = Math.min(s.buffer.length - s.count, len);
152 				System.arraycopy(b, off, s.buffer, s.count, n);
153 				s.count += n;
154 				len -= n;
155 				off += n;
156 			}
157 		}
158 
159 		if (len > 0)
160 			overflow.write(b, off, len);
161 	}
162 
163 	/**
164 	 * Dumps the entire buffer into the overflow stream, and flushes it.
165 	 *
166 	 * @throws IOException
167 	 *             the overflow stream cannot be started, or the buffer contents
168 	 *             cannot be written to it, or it failed to flush.
169 	 */
170 	protected void doFlush() throws IOException {
171 		if (overflow == null)
172 			switchToOverflow();
173 		overflow.flush();
174 	}
175 
176 	/**
177 	 * Copy all bytes remaining on the input stream into this buffer.
178 	 *
179 	 * @param in
180 	 *            the stream to read from, until EOF is reached.
181 	 * @throws IOException
182 	 *             an error occurred reading from the input stream, or while
183 	 *             writing to a local temporary file.
184 	 */
185 	public void copy(final InputStream in) throws IOException {
186 		if (blocks != null) {
187 			for (;;) {
188 				Block s = last();
189 				if (s.isFull()) {
190 					if (reachedInCoreLimit())
191 						break;
192 					s = new Block();
193 					blocks.add(s);
194 				}
195 
196 				int n = in.read(s.buffer, s.count, s.buffer.length - s.count);
197 				if (n < 1)
198 					return;
199 				s.count += n;
200 			}
201 		}
202 
203 		final byte[] tmp = new byte[Block.SZ];
204 		int n;
205 		while ((n = in.read(tmp)) > 0)
206 			overflow.write(tmp, 0, n);
207 	}
208 
209 	/**
210 	 * Obtain the length (in bytes) of the buffer.
211 	 * <p>
212 	 * The length is only accurate after {@link #close()} has been invoked.
213 	 *
214 	 * @return total length of the buffer, in bytes.
215 	 */
216 	public long length() {
217 		return inCoreLength();
218 	}
219 
220 	private long inCoreLength() {
221 		final Block last = last();
222 		return ((long) blocks.size() - 1) * Block.SZ + last.count;
223 	}
224 
225 	/**
226 	 * Convert this buffer's contents into a contiguous byte array.
227 	 * <p>
228 	 * The buffer is only complete after {@link #close()} has been invoked.
229 	 *
230 	 * @return the complete byte array; length matches {@link #length()}.
231 	 * @throws IOException
232 	 *             an error occurred reading from a local temporary file
233 	 * @throws OutOfMemoryError
234 	 *             the buffer cannot fit in memory
235 	 */
236 	public byte[] toByteArray() throws IOException {
237 		final long len = length();
238 		if (Integer.MAX_VALUE < len)
239 			throw new OutOfMemoryError(JGitText.get().lengthExceedsMaximumArraySize);
240 		final byte[] out = new byte[(int) len];
241 		int outPtr = 0;
242 		for (final Block b : blocks) {
243 			System.arraycopy(b.buffer, 0, out, outPtr, b.count);
244 			outPtr += b.count;
245 		}
246 		return out;
247 	}
248 
249 	/**
250 	 * Send this buffer to an output stream.
251 	 * <p>
252 	 * This method may only be invoked after {@link #close()} has completed
253 	 * normally, to ensure all data is completely transferred.
254 	 *
255 	 * @param os
256 	 *            stream to send this buffer's complete content to.
257 	 * @param pm
258 	 *            if not null progress updates are sent here. Caller should
259 	 *            initialize the task and the number of work units to <code>
260 	 *            {@link #length()}/1024</code>.
261 	 * @throws IOException
262 	 *             an error occurred reading from a temporary file on the local
263 	 *             system, or writing to the output stream.
264 	 */
265 	public void writeTo(final OutputStream os, ProgressMonitor pm)
266 			throws IOException {
267 		if (pm == null)
268 			pm = NullProgressMonitor.INSTANCE;
269 		for (final Block b : blocks) {
270 			os.write(b.buffer, 0, b.count);
271 			pm.update(b.count / 1024);
272 		}
273 	}
274 
275 	/**
276 	 * Open an input stream to read from the buffered data.
277 	 * <p>
278 	 * This method may only be invoked after {@link #close()} has completed
279 	 * normally, to ensure all data is completely transferred.
280 	 *
281 	 * @return a stream to read from the buffer. The caller must close the
282 	 *         stream when it is no longer useful.
283 	 * @throws IOException
284 	 *             an error occurred opening the temporary file.
285 	 */
286 	public InputStream openInputStream() throws IOException {
287 		return new BlockInputStream();
288 	}
289 
290 	/** Reset this buffer for reuse, purging all buffered content. */
291 	public void reset() {
292 		if (overflow != null) {
293 			destroy();
294 		}
295 		if (blocks != null)
296 			blocks.clear();
297 		else
298 			blocks = new ArrayList<Block>(initialBlocks);
299 		blocks.add(new Block(Math.min(inCoreLimit, Block.SZ)));
300 	}
301 
302 	/**
303 	 * Open the overflow output stream, so the remaining output can be stored.
304 	 *
305 	 * @return the output stream to receive the buffered content, followed by
306 	 *         the remaining output.
307 	 * @throws IOException
308 	 *             the buffer cannot create the overflow stream.
309 	 */
310 	protected abstract OutputStream overflow() throws IOException;
311 
312 	private Block last() {
313 		return blocks.get(blocks.size() - 1);
314 	}
315 
316 	private boolean reachedInCoreLimit() throws IOException {
317 		if (inCoreLength() < inCoreLimit)
318 			return false;
319 
320 		switchToOverflow();
321 		return true;
322 	}
323 
324 	private void switchToOverflow() throws IOException {
325 		overflow = overflow();
326 
327 		final Block last = blocks.remove(blocks.size() - 1);
328 		for (final Block b : blocks)
329 			overflow.write(b.buffer, 0, b.count);
330 		blocks = null;
331 
332 		overflow = new SafeBufferedOutputStream(overflow, Block.SZ);
333 		overflow.write(last.buffer, 0, last.count);
334 	}
335 
336 	public void close() throws IOException {
337 		if (overflow != null) {
338 			try {
339 				overflow.close();
340 			} finally {
341 				overflow = null;
342 			}
343 		}
344 	}
345 
346 	/** Clear this buffer so it has no data, and cannot be used again. */
347 	public void destroy() {
348 		blocks = null;
349 
350 		if (overflow != null) {
351 			try {
352 				overflow.close();
353 			} catch (IOException err) {
354 				// We shouldn't encounter an error closing the file.
355 			} finally {
356 				overflow = null;
357 			}
358 		}
359 	}
360 
361 	/**
362 	 * A fully buffered output stream using local disk storage for large data.
363 	 * <p>
364 	 * Initially this output stream buffers to memory and is therefore similar
365 	 * to ByteArrayOutputStream, but it shifts to using an on disk temporary
366 	 * file if the output gets too large.
367 	 * <p>
368 	 * The content of this buffered stream may be sent to another OutputStream
369 	 * only after this stream has been properly closed by {@link #close()}.
370 	 */
371 	public static class LocalFile extends TemporaryBuffer {
372 		/** Directory to store the temporary file under. */
373 		private final File directory;
374 
375 		/**
376 		 * Location of our temporary file if we are on disk; otherwise null.
377 		 * <p>
378 		 * If we exceeded the {@link #inCoreLimit} we nulled out {@link #blocks}
379 		 * and created this file instead. All output goes here through
380 		 * {@link #overflow}.
381 		 */
382 		private File onDiskFile;
383 
384 		/**
385 		 * Create a new temporary buffer, limiting memory usage.
386 		 *
387 		 * @param directory
388 		 *            if the buffer has to spill over into a temporary file, the
389 		 *            directory where the file should be saved. If null the
390 		 *            system default temporary directory (for example /tmp) will
391 		 *            be used instead.
392 		 */
393 		public LocalFile(final File directory) {
394 			this(directory, DEFAULT_IN_CORE_LIMIT);
395 		}
396 
397 		/**
398 		 * Create a new temporary buffer, limiting memory usage.
399 		 *
400 		 * @param directory
401 		 *            if the buffer has to spill over into a temporary file, the
402 		 *            directory where the file should be saved. If null the
403 		 *            system default temporary directory (for example /tmp) will
404 		 *            be used instead.
405 		 * @param inCoreLimit
406 		 *            maximum number of bytes to store in memory. Storage beyond
407 		 *            this limit will use the local file.
408 		 */
409 		public LocalFile(final File directory, final int inCoreLimit) {
410 			super(inCoreLimit);
411 			this.directory = directory;
412 		}
413 
414 		protected OutputStream overflow() throws IOException {
415 			onDiskFile = File.createTempFile("jgit_", ".buf", directory); //$NON-NLS-1$ //$NON-NLS-2$
416 			return new BufferedOutputStream(new FileOutputStream(onDiskFile));
417 		}
418 
419 		public long length() {
420 			if (onDiskFile == null) {
421 				return super.length();
422 			}
423 			return onDiskFile.length();
424 		}
425 
426 		public byte[] toByteArray() throws IOException {
427 			if (onDiskFile == null) {
428 				return super.toByteArray();
429 			}
430 
431 			final long len = length();
432 			if (Integer.MAX_VALUE < len)
433 				throw new OutOfMemoryError(JGitText.get().lengthExceedsMaximumArraySize);
434 			final byte[] out = new byte[(int) len];
435 			final FileInputStream in = new FileInputStream(onDiskFile);
436 			try {
437 				IO.readFully(in, out, 0, (int) len);
438 			} finally {
439 				in.close();
440 			}
441 			return out;
442 		}
443 
444 		public void writeTo(final OutputStream os, ProgressMonitor pm)
445 				throws IOException {
446 			if (onDiskFile == null) {
447 				super.writeTo(os, pm);
448 				return;
449 			}
450 			if (pm == null)
451 				pm = NullProgressMonitor.INSTANCE;
452 			final FileInputStream in = new FileInputStream(onDiskFile);
453 			try {
454 				int cnt;
455 				final byte[] buf = new byte[Block.SZ];
456 				while ((cnt = in.read(buf)) >= 0) {
457 					os.write(buf, 0, cnt);
458 					pm.update(cnt / 1024);
459 				}
460 			} finally {
461 				in.close();
462 			}
463 		}
464 
465 		@Override
466 		public InputStream openInputStream() throws IOException {
467 			if (onDiskFile == null)
468 				return super.openInputStream();
469 			return new FileInputStream(onDiskFile);
470 		}
471 
472 		@Override
473 		public void destroy() {
474 			super.destroy();
475 
476 			if (onDiskFile != null) {
477 				try {
478 					if (!onDiskFile.delete())
479 						onDiskFile.deleteOnExit();
480 				} finally {
481 					onDiskFile = null;
482 				}
483 			}
484 		}
485 	}
486 
487 	/**
488 	 * A temporary buffer that will never exceed its in-memory limit.
489 	 * <p>
490 	 * If the in-memory limit is reached an IOException is thrown, rather than
491 	 * attempting to spool to local disk.
492 	 */
493 	public static class Heap extends TemporaryBuffer {
494 		/**
495 		 * Create a new heap buffer with a maximum storage limit.
496 		 *
497 		 * @param limit
498 		 *            maximum number of bytes that can be stored in this buffer;
499 		 *            also used as the estimated size. Storing beyond this many
500 		 *            will cause an IOException to be thrown during write.
501 		 */
502 		public Heap(final int limit) {
503 			super(limit);
504 		}
505 
506 		/**
507 		 * Create a new heap buffer with a maximum storage limit.
508 		 *
509 		 * @param estimatedSize
510 		 *            estimated size of storage used, to size the initial list of
511 		 *            block pointers.
512 		 * @param limit
513 		 *            maximum number of bytes that can be stored in this buffer.
514 		 *            Storing beyond this many will cause an IOException to be
515 		 *            thrown during write.
516 		 * @since 4.0
517 		 */
518 		public Heap(final int estimatedSize, final int limit) {
519 			super(estimatedSize, limit);
520 		}
521 
522 		@Override
523 		protected OutputStream overflow() throws IOException {
524 			throw new IOException(JGitText.get().inMemoryBufferLimitExceeded);
525 		}
526 	}
527 
528 	static class Block {
529 		static final int SZ = 8 * 1024;
530 
531 		final byte[] buffer;
532 
533 		int count;
534 
535 		Block() {
536 			buffer = new byte[SZ];
537 		}
538 
539 		Block(int sz) {
540 			buffer = new byte[sz];
541 		}
542 
543 		boolean isFull() {
544 			return count == buffer.length;
545 		}
546 	}
547 
548 	private class BlockInputStream extends InputStream {
549 		private byte[] singleByteBuffer;
550 		private int blockIndex;
551 		private Block block;
552 		private int blockPos;
553 
554 		BlockInputStream() {
555 			block = blocks.get(blockIndex);
556 		}
557 
558 		@Override
559 		public int read() throws IOException {
560 			if (singleByteBuffer == null)
561 				singleByteBuffer = new byte[1];
562 			int n = read(singleByteBuffer);
563 			return n == 1 ? singleByteBuffer[0] & 0xff : -1;
564 		}
565 
566 		@Override
567 		public long skip(long cnt) throws IOException {
568 			long skipped = 0;
569 			while (0 < cnt) {
570 				int n = (int) Math.min(block.count - blockPos, cnt);
571 				if (0 < n) {
572 					blockPos += n;
573 					skipped += n;
574 					cnt -= n;
575 				} else if (nextBlock())
576 					continue;
577 				else
578 					break;
579 			}
580 			return skipped;
581 		}
582 
583 		@Override
584 		public int read(byte[] b, int off, int len) throws IOException {
585 			if (len == 0)
586 				return 0;
587 			int copied = 0;
588 			while (0 < len) {
589 				int c = Math.min(block.count - blockPos, len);
590 				if (0 < c) {
591 					System.arraycopy(block.buffer, blockPos, b, off, c);
592 					blockPos += c;
593 					off += c;
594 					len -= c;
595 					copied += c;
596 				} else if (nextBlock())
597 					continue;
598 				else
599 					break;
600 			}
601 			return 0 < copied ? copied : -1;
602 		}
603 
604 		private boolean nextBlock() {
605 			if (++blockIndex < blocks.size()) {
606 				block = blocks.get(blockIndex);
607 				blockPos = 0;
608 				return true;
609 			}
610 			return false;
611 		}
612 	}
613 }