View Javadoc
1   /*
2    * Copyright (C) 2010, 2013 Marc Strapetz <marc.strapetz@syntevo.com>
3    * Copyright (C) 2015, Ivan Motsch <ivan.motsch@bsiag.com>
4    * and other copyright owners as documented in the project's IP log.
5    *
6    * This program and the accompanying materials are made available
7    * under the terms of the Eclipse Distribution License v1.0 which
8    * accompanies this distribution, is reproduced below, and is
9    * available at http://www.eclipse.org/org/documents/edl-v10.php
10   *
11   * All rights reserved.
12   *
13   * Redistribution and use in source and binary forms, with or
14   * without modification, are permitted provided that the following
15   * conditions are met:
16   *
17   * - Redistributions of source code must retain the above copyright
18   *   notice, this list of conditions and the following disclaimer.
19   *
20   * - Redistributions in binary form must reproduce the above
21   *   copyright notice, this list of conditions and the following
22   *   disclaimer in the documentation and/or other materials provided
23   *   with the distribution.
24   *
25   * - Neither the name of the Eclipse Foundation, Inc. nor the
26   *   names of its contributors may be used to endorse or promote
27   *   products derived from this software without specific prior
28   *   written permission.
29   *
30   * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
31   * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
32   * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
33   * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
34   * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
35   * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
36   * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
37   * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
38   * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
39   * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
40   * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
41   * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
42   * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
43   */
44  
45  package org.eclipse.jgit.util.io;
46  
47  import java.io.IOException;
48  import java.io.InputStream;
49  
50  import org.eclipse.jgit.diff.RawText;
51  
52  /**
53   * An InputStream that normalizes CRLF to LF.
54   *
55   * Existing single CR are not changed to LF, but retained as is.
56   *
57   * Optionally, a binary check on the first 8000 bytes is performed and in case
58   * of binary files, canonicalization is turned off (for the complete file).
59   * <p>
60   * This is the former EolCanonicalizingInputStream with a new name in order to
61   * have same naming for all LF / CRLF streams
62   *
63   * @since 4.3
64   */
65  public class AutoLFInputStream extends InputStream {
66  	private final byte[] single = new byte[1];
67  
68  	private final byte[] buf = new byte[8096];
69  
70  	private final InputStream in;
71  
72  	private int cnt;
73  
74  	private int ptr;
75  
76  	private boolean isBinary;
77  
78  	private boolean detectBinary;
79  
80  	private boolean abortIfBinary;
81  
82  	/**
83  	 * A special exception thrown when {@link AutoLFInputStream} is told to
84  	 * throw an exception when attempting to read a binary file. The exception
85  	 * may be thrown at any stage during reading.
86  	 *
87  	 * @since 3.3
88  	 */
89  	public static class IsBinaryException extends IOException {
90  		private static final long serialVersionUID = 1L;
91  
92  		IsBinaryException() {
93  			super();
94  		}
95  	}
96  
97  	/**
98  	 * Creates a new InputStream, wrapping the specified stream
99  	 *
100 	 * @param in
101 	 *            raw input stream
102 	 * @param detectBinary
103 	 *            whether binaries should be detected
104 	 * @since 2.0
105 	 */
106 	public AutoLFInputStream(InputStream in, boolean detectBinary) {
107 		this(in, detectBinary, false);
108 	}
109 
110 	/**
111 	 * Creates a new InputStream, wrapping the specified stream
112 	 *
113 	 * @param in
114 	 *            raw input stream
115 	 * @param detectBinary
116 	 *            whether binaries should be detected
117 	 * @param abortIfBinary
118 	 *            throw an IOException if the file is binary
119 	 * @since 3.3
120 	 */
121 	public AutoLFInputStream(InputStream in, boolean detectBinary,
122 			boolean abortIfBinary) {
123 		this.in = in;
124 		this.detectBinary = detectBinary;
125 		this.abortIfBinary = abortIfBinary;
126 	}
127 
128 	@Override
129 	public int read() throws IOException {
130 		final int read = read(single, 0, 1);
131 		return read == 1 ? single[0] & 0xff : -1;
132 	}
133 
134 	@Override
135 	public int read(byte[] bs, final int off, final int len)
136 			throws IOException {
137 		if (len == 0)
138 			return 0;
139 
140 		if (cnt == -1)
141 			return -1;
142 
143 		int i = off;
144 		final int end = off + len;
145 
146 		while (i < end) {
147 			if (ptr == cnt && !fillBuffer()) {
148 				break;
149 			}
150 
151 			byte b = buf[ptr++];
152 			if (isBinary || b != '\r') {
153 				// Logic for binary files ends here
154 				bs[i++] = b;
155 				continue;
156 			}
157 
158 			if (ptr == cnt && !fillBuffer()) {
159 				bs[i++] = '\r';
160 				break;
161 			}
162 
163 			if (buf[ptr] == '\n') {
164 				bs[i++] = '\n';
165 				ptr++;
166 			} else
167 				bs[i++] = '\r';
168 		}
169 
170 		return i == off ? -1 : i - off;
171 	}
172 
173 	/**
174 	 * @return true if the stream has detected as a binary so far
175 	 * @since 3.3
176 	 */
177 	public boolean isBinary() {
178 		return isBinary;
179 	}
180 
181 	@Override
182 	public void close() throws IOException {
183 		in.close();
184 	}
185 
186 	private boolean fillBuffer() throws IOException {
187 		cnt = in.read(buf, 0, buf.length);
188 		if (cnt < 1)
189 			return false;
190 		if (detectBinary) {
191 			isBinary = RawText.isBinary(buf, cnt);
192 			detectBinary = false;
193 			if (isBinary && abortIfBinary)
194 				throw new IsBinaryException();
195 		}
196 		ptr = 0;
197 		return true;
198 	}
199 }