You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

EolCanonicalizingInputStream.java 3.9KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146
  1. /*
  2. * Copyright (C) 2010, Marc Strapetz <marc.strapetz@syntevo.com>
  3. * and other copyright owners as documented in the project's IP log.
  4. *
  5. * This program and the accompanying materials are made available
  6. * under the terms of the Eclipse Distribution License v1.0 which
  7. * accompanies this distribution, is reproduced below, and is
  8. * available at http://www.eclipse.org/org/documents/edl-v10.php
  9. *
  10. * All rights reserved.
  11. *
  12. * Redistribution and use in source and binary forms, with or
  13. * without modification, are permitted provided that the following
  14. * conditions are met:
  15. *
  16. * - Redistributions of source code must retain the above copyright
  17. * notice, this list of conditions and the following disclaimer.
  18. *
  19. * - Redistributions in binary form must reproduce the above
  20. * copyright notice, this list of conditions and the following
  21. * disclaimer in the documentation and/or other materials provided
  22. * with the distribution.
  23. *
  24. * - Neither the name of the Eclipse Foundation, Inc. nor the
  25. * names of its contributors may be used to endorse or promote
  26. * products derived from this software without specific prior
  27. * written permission.
  28. *
  29. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
  30. * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
  31. * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  32. * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  33. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
  34. * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  35. * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  36. * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  37. * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  38. * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
  39. * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  40. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
  41. * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  42. */
  43. package org.eclipse.jgit.util.io;
  44. import java.io.IOException;
  45. import java.io.InputStream;
  46. import org.eclipse.jgit.diff.RawText;
  47. /**
  48. * An input stream which canonicalizes EOLs bytes on the fly to '\n'.
  49. *
  50. * Optionally, a binary check on the first 8000 bytes is performed
  51. * and in case of binary files, canonicalization is turned off
  52. * (for the complete file).
  53. */
  54. public class EolCanonicalizingInputStream extends InputStream {
  55. private final byte[] single = new byte[1];
  56. private final byte[] buf = new byte[8096];
  57. private final InputStream in;
  58. private int cnt;
  59. private int ptr;
  60. private boolean isBinary;
  61. private boolean detectBinary;
  62. /**
  63. * Creates a new InputStream, wrapping the specified stream
  64. *
  65. * @param in
  66. * raw input stream
  67. * @param detectBinary
  68. * whether binaries should be detected
  69. */
  70. public EolCanonicalizingInputStream(InputStream in, boolean detectBinary) {
  71. this.in = in;
  72. this.detectBinary = detectBinary;
  73. }
  74. @Override
  75. public int read() throws IOException {
  76. final int read = read(single, 0, 1);
  77. return read == 1 ? single[0] & 0xff : -1;
  78. }
  79. @Override
  80. public int read(byte[] bs, int off, int len) throws IOException {
  81. if (len == 0)
  82. return 0;
  83. if (cnt == -1)
  84. return -1;
  85. final int startOff = off;
  86. final int end = off + len;
  87. while (off < end) {
  88. if (ptr == cnt && !fillBuffer()) {
  89. break;
  90. }
  91. byte b = buf[ptr++];
  92. if (isBinary || b != '\r') {
  93. // Logic for binary files ends here
  94. bs[off++] = b;
  95. continue;
  96. }
  97. if (ptr == cnt && !fillBuffer()) {
  98. bs[off++] = '\r';
  99. break;
  100. }
  101. if (buf[ptr] == '\n') {
  102. bs[off++] = '\n';
  103. ptr++;
  104. } else
  105. bs[off++] = '\r';
  106. }
  107. return startOff == off ? -1 : off - startOff;
  108. }
  109. @Override
  110. public void close() throws IOException {
  111. in.close();
  112. }
  113. private boolean fillBuffer() throws IOException {
  114. cnt = in.read(buf, 0, buf.length);
  115. if (cnt < 1)
  116. return false;
  117. if (detectBinary) {
  118. isBinary = RawText.isBinary(buf, cnt);
  119. detectBinary = false;
  120. }
  121. ptr = 0;
  122. return true;
  123. }
  124. }