Browse Source

[bug-63576] support capitalized text in WordExtractor (HWPF)

git-svn-id: https://svn.apache.org/repos/asf/poi/trunk@1903738 13f79535-47bb-0310-9956-ffa450edef68
tags/REL_5_2_3
PJ Fanning 1 year ago
parent
commit
913d1eecf5

+ 5
- 0
poi-scratchpad/src/main/java/org/apache/poi/hwpf/converter/AbstractWordConverter.java View File

@@ -52,6 +52,7 @@ import org.apache.poi.hwpf.usermodel.TableRow;
import org.apache.poi.poifs.filesystem.Entry;
import org.apache.poi.util.Beta;
import org.apache.poi.util.Internal;
import org.apache.poi.util.LocaleUtil;
import org.apache.poi.util.StringUtil;
import org.w3c.dom.Document;
import org.w3c.dom.Element;
@@ -445,6 +446,10 @@ public abstract class AbstractWordConverter {
continue;
}

if (characterRun.isCapitalized() || characterRun.isSmallCaps()) {
text = text.toUpperCase(LocaleUtil.getUserLocale());
}

if (characterRun.isSpecialCharacter()) {
if (text.charAt(0) == SPECCHAR_AUTONUMBERED_FOOTNOTE_REFERENCE
&& (wordDocument instanceof HWPFDocument)) {

+ 8
- 0
poi-scratchpad/src/test/java/org/apache/poi/hwpf/extractor/TestWordExtractor.java View File

@@ -402,6 +402,14 @@ public final class TestWordExtractor {
}
}

@Test
void testCapitalized() throws Exception {
try (WordExtractor wExt = openExtractor("capitalized.doc")) {
String text = wExt.getText().trim();
assertEquals("The following word is: CAPITALIZED.", text);
}
}

private WordExtractor openExtractor(String fileName) throws IOException {
try (InputStream is = docTests.openResourceAsStream(fileName)) {
return new WordExtractor(is);

BIN
test-data/document/capitalized.doc View File


Loading…
Cancel
Save