/*
 * Copyright (C) 2010, 2013 Marc Strapetz <marc.strapetz@syntevo.com>
 * Copyright (C) 2015, Ivan Motsch <ivan.motsch@bsiag.com>
 * and other copyright owners as documented in the project's IP log.
 *
 * This program and the accompanying materials are made available
 * under the terms of the Eclipse Distribution License v1.0 which
 * accompanies this distribution, is reproduced below, and is
 * available at http://www.eclipse.org/org/documents/edl-v10.php
 *
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or
 * without modification, are permitted provided that the following
 * conditions are met:
 *
 * - Redistributions of source code must retain the above copyright
 *   notice, this list of conditions and the following disclaimer.
 *
 * - Redistributions in binary form must reproduce the above
 *   copyright notice, this list of conditions and the following
 *   disclaimer in the documentation and/or other materials provided
 *   with the distribution.
 *
 * - Neither the name of the Eclipse Foundation, Inc. nor the
 *   names of its contributors may be used to endorse or promote
 *   products derived from this software without specific prior
 *   written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
 * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
 * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
 * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

package org.eclipse.jgit.util.io;

import java.io.IOException;
import java.io.InputStream;

import org.eclipse.jgit.diff.RawText;

/**
 * An InputStream that normalizes CRLF to LF.
 *
 * Existing single CR are not changed to LF, but retained as is.
 *
 * Optionally, a binary check is performed on the first buffer fill (up to
 * 8096 bytes from the start of the stream are handed to
 * {@link RawText#isBinary(byte[], int)}) and in case of binary files,
 * canonicalization is turned off (for the complete file).
 * <p>
 * This is the former EolCanonicalizingInputStream with a new name in order to
 * have same naming for all LF / CRLF streams
 *
 * @since 4.3
 */
public class AutoLFInputStream extends InputStream {
	/** Scratch array backing the single-byte {@link #read()}. */
	private final byte[] single = new byte[1];

	/** Raw bytes read from {@link #in} that were not yet handed out. */
	private final byte[] buf = new byte[8096];

	private final InputStream in;

	/** Number of valid bytes in {@link #buf}; -1 once the source is at EOF. */
	private int cnt;

	/** Index of the next unread byte in {@link #buf}. */
	private int ptr;

	/** Result of the binary check; when set, bytes pass through unchanged. */
	private boolean isBinary;

	/** True until the (one-time) binary check has been performed. */
	private boolean detectBinary;

	private final boolean abortIfBinary;

	/**
	 * A special exception thrown when {@link AutoLFInputStream} is told to
	 * throw an exception when attempting to read a binary file. The exception
	 * may be thrown at any stage during reading.
	 *
	 * @since 3.3
	 */
	public static class IsBinaryException extends IOException {
		private static final long serialVersionUID = 1L;

		IsBinaryException() {
			super();
		}
	}

	/**
	 * Creates a new InputStream, wrapping the specified stream
	 *
	 * @param in
	 *            raw input stream
	 * @param detectBinary
	 *            whether binaries should be detected
	 * @since 2.0
	 */
	public AutoLFInputStream(InputStream in, boolean detectBinary) {
		this(in, detectBinary, false);
	}

	/**
	 * Creates a new InputStream, wrapping the specified stream
	 *
	 * @param in
	 *            raw input stream
	 * @param detectBinary
	 *            whether binaries should be detected
	 * @param abortIfBinary
	 *            throw an IOException if the file is binary
	 * @since 3.3
	 */
	public AutoLFInputStream(InputStream in, boolean detectBinary,
			boolean abortIfBinary) {
		this.in = in;
		this.detectBinary = detectBinary;
		this.abortIfBinary = abortIfBinary;
	}

	/**
	 * Reads a single normalized byte.
	 *
	 * @return the byte as a value in the range 0..255, or -1 at end of
	 *         stream
	 * @throws IOException
	 *             if the underlying stream fails, or an
	 *             {@link IsBinaryException} if the content is binary and
	 *             aborting on binary content was requested
	 */
	@Override
	public int read() throws IOException {
		final int read = read(single, 0, 1);
		return read == 1 ? single[0] & 0xff : -1;
	}

	/**
	 * Reads up to {@code len} normalized bytes into {@code bs}.
	 * <p>
	 * Every CR immediately followed by LF is collapsed into a single LF; a
	 * CR that is not followed by LF is copied unchanged. If the content was
	 * detected as binary, all bytes are copied unchanged.
	 *
	 * @param bs
	 *            destination array
	 * @param off
	 *            index in {@code bs} of the first byte to write
	 * @param len
	 *            maximum number of bytes to write
	 * @return number of bytes written, 0 if {@code len} is 0, or -1 at end
	 *         of stream
	 * @throws IOException
	 *             if the underlying stream fails, or an
	 *             {@link IsBinaryException} if the content is binary and
	 *             aborting on binary content was requested
	 * @throws IndexOutOfBoundsException
	 *             if {@code off} or {@code len} is negative, or the range
	 *             does not fit into {@code bs}
	 */
	@Override
	public int read(byte[] bs, final int off, final int len)
			throws IOException {
		// Reject bad ranges before any input is consumed; a negative len
		// must not be reported as end of stream.
		if (off < 0 || len < 0 || len > bs.length - off) {
			throw new IndexOutOfBoundsException();
		}
		if (len == 0) {
			return 0;
		}
		if (cnt == -1) {
			return -1;
		}

		int i = off;
		final int end = off + len;
		while (i < end) {
			if (ptr == cnt && !fillBuffer()) {
				break;
			}

			final byte b = buf[ptr++];
			if (isBinary || b != '\r') {
				// Logic for binary files ends here
				bs[i++] = b;
				continue;
			}

			// b is a CR: the next byte decides whether it is dropped. If
			// the CR was the last byte of the stream it is kept.
			if (ptr == cnt && !fillBuffer()) {
				bs[i++] = '\r';
				break;
			}

			if (buf[ptr] == '\n') {
				// CRLF: emit only the LF and consume it
				bs[i++] = '\n';
				ptr++;
			} else {
				// lone CR: keep it, the following byte is handled by the
				// next iteration
				bs[i++] = '\r';
			}
		}

		return i == off ? -1 : i - off;
	}

	/**
	 * @return true if the stream has been detected as binary so far
	 * @since 3.3
	 */
	public boolean isBinary() {
		return isBinary;
	}

	/**
	 * Closes the wrapped stream.
	 *
	 * @throws IOException
	 *             if closing the wrapped stream fails
	 */
	@Override
	public void close() throws IOException {
		in.close();
	}

	/**
	 * Refills {@link #buf} from the wrapped stream and, on the first fill
	 * with detection enabled, runs the binary check.
	 * <p>
	 * While the binary check is still pending, reading continues until the
	 * buffer is full or the source is exhausted, so that a short first read
	 * from the source does not shrink the sample the check is based on.
	 * Afterwards a single non-empty read is enough. Zero-length reads are
	 * retried so that the buffer is never left empty with a stale
	 * {@link #ptr}.
	 *
	 * @return true if at least one byte is available in the buffer, false
	 *         if the source is at EOF (in which case {@link #cnt} is -1)
	 * @throws IOException
	 *             if the underlying stream fails, or an
	 *             {@link IsBinaryException} if the content is binary and
	 *             aborting on binary content was requested
	 */
	private boolean fillBuffer() throws IOException {
		int filled = 0;
		while (filled < buf.length) {
			final int n = in.read(buf, filled, buf.length - filled);
			if (n < 0) {
				break;
			}
			filled += n;
			if (filled > 0 && !detectBinary) {
				// Not sampling for detection: do not block for more data
				break;
			}
		}
		if (filled == 0) {
			// Latch EOF so that later read() calls return -1 immediately
			cnt = -1;
			return false;
		}
		cnt = filled;
		ptr = 0;
		if (detectBinary) {
			detectBinary = false;
			isBinary = RawText.isBinary(buf, cnt);
			if (isBinary && abortIfBinary) {
				throw new IsBinaryException();
			}
		}
		return true;
	}
}