You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

WhitespaceCollapser.java 6.2KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150
  1. /*
  2. * $Id$
  3. * ============================================================================
  4. * The Apache Software License, Version 1.1
  5. * ============================================================================
  6. *
  7. * Copyright (C) 1999-2003 The Apache Software Foundation. All rights reserved.
  8. *
  9. * Redistribution and use in source and binary forms, with or without modifica-
  10. * tion, are permitted provided that the following conditions are met:
  11. *
  12. * 1. Redistributions of source code must retain the above copyright notice,
  13. * this list of conditions and the following disclaimer.
  14. *
  15. * 2. Redistributions in binary form must reproduce the above copyright notice,
  16. * this list of conditions and the following disclaimer in the documentation
  17. * and/or other materials provided with the distribution.
  18. *
  19. * 3. The end-user documentation included with the redistribution, if any, must
  20. * include the following acknowledgment: "This product includes software
  21. * developed by the Apache Software Foundation (http://www.apache.org/)."
  22. * Alternately, this acknowledgment may appear in the software itself, if
  23. * and wherever such third-party acknowledgments normally appear.
  24. *
  25. * 4. The names "FOP" and "Apache Software Foundation" must not be used to
  26. * endorse or promote products derived from this software without prior
  27. * written permission. For written permission, please contact
  28. * apache@apache.org.
  29. *
  30. * 5. Products derived from this software may not be called "Apache", nor may
  31. * "Apache" appear in their name, without prior written permission of the
  32. * Apache Software Foundation.
  33. *
  34. * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED WARRANTIES,
  35. * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
  36. * FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
  37. * APACHE SOFTWARE FOUNDATION OR ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT,
  38. * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLU-
  39. * DING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
  40. * OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
  41. * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  42. * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
  43. * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  44. * ============================================================================
  45. *
  46. * This software consists of voluntary contributions made by many individuals
  47. * on behalf of the Apache Software Foundation and was originally created by
  48. * James Tauber <jtauber@jtauber.com>. For more information on the Apache
  49. * Software Foundation, please see <http://www.apache.org/>.
  50. */
  51. /*
  52. * This file is part of the RTF library of the FOP project, which was originally
  53. * created by Bertrand Delacretaz <bdelacretaz@codeconsult.ch> and by other
  54. * contributors to the jfor project (www.jfor.org), who agreed to donate jfor to
  55. * the FOP project.
  56. */
  57. package org.apache.fop.render.rtf.rtflib.rtfdoc;
  58. import java.util.Iterator;
  59. import java.util.StringTokenizer;
  60. /** Collapses whitespace of an RtfContainer that contains RtfText elements
  61. * @author Bertrand Delacretaz bdelacretaz@codeconsult.ch
  62. */
  63. class WhitespaceCollapser {
  64. private static final String SPACE = " ";
  65. private boolean lastEndSpace = true;
  66. /** remove extra whitespace in RtfText elements that are inside c */
  67. WhitespaceCollapser(RtfContainer c) {
  68. // process all texts
  69. for (Iterator it = c.getChildren().iterator(); it.hasNext();) {
  70. final Object kid = it.next();
  71. if (kid instanceof RtfText) {
  72. RtfText current = (RtfText)kid;
  73. processText(current);
  74. } else if (kid instanceof RtfString) {
  75. RtfString current = (RtfString)kid;
  76. processString(current);
  77. } else {
  78. // if there is something between two texts, it counts for a space
  79. lastEndSpace = true;
  80. }
  81. }
  82. }
  83. /** process one RtfText from our container */
  84. private void processText(RtfText txt) {
  85. final String newString=processString(txt.getText());
  86. if(newString!=null) {
  87. txt.setText(newString);
  88. }
  89. }
  90. /** process one RtfString from our container */
  91. private void processString(RtfString txt) {
  92. final String newString=processString(txt.getText());
  93. if(newString!=null) {
  94. txt.setText(newString);
  95. }
  96. }
  97. /** process one String */
  98. private String processString(String txt) {
  99. final String orig = txt;
  100. // tokenize the text based on whitespace and regenerate it so as
  101. // to collapse multiple spaces into one
  102. if(orig==null) {
  103. return null;
  104. } else if (orig.length() > 0) {
  105. final boolean allSpaces = orig.trim().length() == 0;
  106. final boolean endSpace = allSpaces
  107. || Character.isWhitespace(orig.charAt(orig.length() - 1));
  108. final boolean beginSpace = Character.isWhitespace(orig.charAt(0));
  109. final StringBuffer sb = new StringBuffer(orig.length());
  110. // if text contains spaces only, keep at most one
  111. if (allSpaces) {
  112. if (!lastEndSpace) {
  113. sb.append(SPACE);
  114. }
  115. } else {
  116. // TODO to be compatible with different Locales, should use Character.isWhitespace
  117. // instead of this limited list
  118. boolean first = true;
  119. final StringTokenizer stk = new StringTokenizer(txt, " \t\n\r");
  120. while (stk.hasMoreTokens()) {
  121. if (first && beginSpace && !lastEndSpace) {
  122. sb.append(SPACE);
  123. }
  124. first = false;
  125. sb.append(stk.nextToken());
  126. if (stk.hasMoreTokens() || endSpace) {
  127. sb.append(SPACE);
  128. }
  129. }
  130. }
  131. lastEndSpace = endSpace;
  132. return sb.toString();
  133. } else {
  134. return "";
  135. }
  136. }
  137. }