aboutsummaryrefslogtreecommitdiffstats
path: root/src/java/org/apache/poi
diff options
context:
space:
mode:
authorAndreas Beeker <kiwiwings@apache.org>2018-12-28 23:43:31 +0000
committerAndreas Beeker <kiwiwings@apache.org>2018-12-28 23:43:31 +0000
commitc039da1b94a24224bcd7d6a09b1828782a2acb00 (patch)
treea6e4f58d3565bdec89873d6582f0bb9afc32c8aa /src/java/org/apache/poi
parenta78bd71fc1f3bd60af434774744b5dfacfced403 (diff)
downloadpoi-c039da1b94a24224bcd7d6a09b1828782a2acb00.tar.gz
poi-c039da1b94a24224bcd7d6a09b1828782a2acb00.zip
#63028 - Provide font embedding for slideshows
git-svn-id: https://svn.apache.org/repos/asf/poi/trunk@1849898 13f79535-47bb-0310-9956-ffa450edef68
Diffstat (limited to 'src/java/org/apache/poi')
-rw-r--r--src/java/org/apache/poi/common/usermodel/fonts/FontCharset.java2
-rw-r--r--src/java/org/apache/poi/common/usermodel/fonts/FontFacet.java75
-rw-r--r--src/java/org/apache/poi/common/usermodel/fonts/FontHeader.java227
-rw-r--r--src/java/org/apache/poi/common/usermodel/fonts/FontInfo.java68
-rw-r--r--src/java/org/apache/poi/sl/draw/DrawFontInfo.java48
-rw-r--r--src/java/org/apache/poi/sl/extractor/SlideShowExtractor.java305
-rw-r--r--src/java/org/apache/poi/sl/usermodel/FontCollection.java22
-rw-r--r--src/java/org/apache/poi/sl/usermodel/Resources.java29
-rw-r--r--src/java/org/apache/poi/sl/usermodel/Slide.java3
-rw-r--r--src/java/org/apache/poi/sl/usermodel/SlideShow.java29
-rw-r--r--src/java/org/apache/poi/sl/usermodel/TextRun.java8
11 files changed, 585 insertions, 231 deletions
diff --git a/src/java/org/apache/poi/common/usermodel/fonts/FontCharset.java b/src/java/org/apache/poi/common/usermodel/fonts/FontCharset.java
index aeeca9284c..32915149f2 100644
--- a/src/java/org/apache/poi/common/usermodel/fonts/FontCharset.java
+++ b/src/java/org/apache/poi/common/usermodel/fonts/FontCharset.java
@@ -70,7 +70,7 @@ public enum FontCharset {
/** Specifies the Russian Cyrillic character set. */
RUSSIAN(0x000000CC, "Cp1251"),
/** Specifies the Thai character set. */
- THAI_(0x000000DE, "x-windows-874"),
+ THAI(0x000000DE, "x-windows-874"),
/** Specifies a Eastern European character set. */
EASTEUROPE(0x000000EE, "Cp1250"),
/**
diff --git a/src/java/org/apache/poi/common/usermodel/fonts/FontFacet.java b/src/java/org/apache/poi/common/usermodel/fonts/FontFacet.java
new file mode 100644
index 0000000000..5fb16908cd
--- /dev/null
+++ b/src/java/org/apache/poi/common/usermodel/fonts/FontFacet.java
@@ -0,0 +1,75 @@
+/* ====================================================================
+Licensed to the Apache Software Foundation (ASF) under one or more
+contributor license agreements. See the NOTICE file distributed with
+this work for additional information regarding copyright ownership.
+The ASF licenses this file to You under the Apache License, Version 2.0
+(the "License"); you may not use this file except in compliance with
+the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==================================================================== */
+
+package org.apache.poi.common.usermodel.fonts;
+
+import org.apache.poi.util.Beta;
+
+/**
+ * A FontFacet holds the font data for a shape of a font, i.e. a regular,
+ * italic, bold or bold-italic version of a Font.
+ */
+@SuppressWarnings("unused")
+@Beta
+public interface FontFacet {
+ /**
+ * Get the font weight.<p>
+ *
+ * The weight of the font in the range 0 through 1000.
+ * For example, 400 is normal and 700 is bold.
+ * If this value is zero, a default weight is used.
+ *
+ * @return the font weight
+ *
+ * @since POI 4.1.0
+ */
+ default int getWeight() {
+ return FontHeader.REGULAR_WEIGHT;
+ }
+
+ /**
+ * Set the font weight
+ *
+ * @param weight the font weight
+ */
+ default void setWeight(int weight) {
+ throw new UnsupportedOperationException("FontFacet is read-only.");
+ }
+
+ /**
+ * @return {@code true}, if the font is italic
+ */
+ default boolean isItalic() {
+ return false;
+ }
+
+ /**
+ * Set the font posture
+ *
+ * @param italic {@code true} for italic, {@code false} for regular
+ */
+ default void setItalic(boolean italic) {
+ throw new UnsupportedOperationException("FontFacet is read-only.");
+ }
+
+ /**
+ * @return the wrapper object holding the font data
+ */
+ default Object getFontData() {
+ return null;
+ }
+}
diff --git a/src/java/org/apache/poi/common/usermodel/fonts/FontHeader.java b/src/java/org/apache/poi/common/usermodel/fonts/FontHeader.java
new file mode 100644
index 0000000000..9777f0cc75
--- /dev/null
+++ b/src/java/org/apache/poi/common/usermodel/fonts/FontHeader.java
@@ -0,0 +1,227 @@
+/* ====================================================================
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+==================================================================== */
+
+package org.apache.poi.common.usermodel.fonts;
+
+import java.io.IOException;
+import java.io.InputStream;
+import java.nio.charset.StandardCharsets;
+
+import org.apache.poi.util.IOUtils;
+import org.apache.poi.util.LittleEndianByteArrayInputStream;
+import org.apache.poi.util.LittleEndianInput;
+import org.apache.poi.util.LittleEndianInputStream;
+
+
+/**
+ * The header data of an EOT font.<p>
+ *
+ * Currently only version 1 fields are read to identify a stream to be embedded.
+ *
+ * @see <a href="http://www.w3.org/Submission/EOT">Embedded OpenType (EOT) File Format</a>
+ */
+@SuppressWarnings({"FieldCanBeLocal", "unused", "Duplicates"})
+public class FontHeader implements FontInfo {
+ /**
+ * Fonts with a font weight of 400 are regarded as regular weighted.
+ * Higher font weights (up to 1000) are bold - lower weights are thin.
+ */
+ public static final int REGULAR_WEIGHT = 400;
+
+ private int eotSize;
+ private int fontDataSize;
+ private int version;
+ private int flags;
+ private final byte[] panose = new byte[10];
+ private byte charset;
+ private byte italic;
+ private int weight;
+ private int fsType;
+ private int magic;
+ private int unicodeRange1;
+ private int unicodeRange2;
+ private int unicodeRange3;
+ private int unicodeRange4;
+ private int codePageRange1;
+ private int codePageRange2;
+ private int checkSumAdjustment;
+ private String familyName;
+ private String styleName;
+ private String versionName;
+ private String fullName;
+
+ public void init(byte[] source, int offset, int length) {
+ init(new LittleEndianByteArrayInputStream(source, offset, length));
+ }
+
+ public void init(LittleEndianInput leis) {
+ eotSize = leis.readInt();
+ fontDataSize = leis.readInt();
+ version = leis.readInt();
+ if (version != 0x00010000 && version != 0x00020001 && version != 0x00020002) {
+ throw new RuntimeException("not a EOT font data stream");
+ }
+ flags = leis.readInt();
+ leis.readFully(panose);
+ charset = leis.readByte();
+ italic = leis.readByte();
+ weight = leis.readInt();
+ fsType = leis.readUShort();
+ magic = leis.readUShort();
+ if (magic != 0x504C) {
+ throw new RuntimeException("not a EOT font data stream");
+ }
+ unicodeRange1 = leis.readInt();
+ unicodeRange2 = leis.readInt();
+ unicodeRange3 = leis.readInt();
+ unicodeRange4 = leis.readInt();
+ codePageRange1 = leis.readInt();
+ codePageRange2 = leis.readInt();
+ checkSumAdjustment = leis.readInt();
+ int reserved1 = leis.readInt();
+ int reserved2 = leis.readInt();
+ int reserved3 = leis.readInt();
+ int reserved4 = leis.readInt();
+ familyName = readName(leis);
+ styleName = readName(leis);
+ versionName = readName(leis);
+ fullName = readName(leis);
+
+ }
+
+ public InputStream bufferInit(InputStream fontStream) throws IOException {
+ LittleEndianInputStream is = new LittleEndianInputStream(fontStream);
+ is.mark(1000);
+ init(is);
+ is.reset();
+ return is;
+ }
+
+ private String readName(LittleEndianInput leis) {
+ // padding
+ leis.readShort();
+ int nameSize = leis.readUShort();
+ byte[] nameBuf = IOUtils.safelyAllocate(nameSize, 1000);
+ leis.readFully(nameBuf);
+ // may be 0-terminated, just trim it away
+ return new String(nameBuf, 0, nameSize, StandardCharsets.UTF_16LE).trim();
+ }
+
+ public boolean isItalic() {
+ return italic != 0;
+ }
+
+ public int getWeight() {
+ return weight;
+ }
+
+ public boolean isBold() {
+ return getWeight() > REGULAR_WEIGHT;
+ }
+
+ public byte getCharsetByte() {
+ return charset;
+ }
+
+ public FontCharset getCharset() {
+ return FontCharset.valueOf(getCharsetByte());
+ }
+
+ public FontPitch getPitch() {
+ byte familyKind = panose[0];
+ switch (familyKind) {
+ default:
+ // Any
+ case 0:
+ // No Fit
+ case 1:
+ return FontPitch.VARIABLE;
+
+ // Latin Text
+ case 2:
+ // Latin Decorative
+ case 4:
+ byte proportion = panose[3];
+ return proportion == 9 ? FontPitch.FIXED : FontPitch.VARIABLE;
+
+ // Latin Hand Written
+ case 3:
+ // Latin Symbol
+ case 5:
+ byte spacing = panose[3];
+ return spacing == 3 ? FontPitch.FIXED : FontPitch.VARIABLE;
+ }
+
+ }
+
+ public FontFamily getFamily() {
+ switch (panose[0]) {
+ // Any
+ case 0:
+ // No Fit
+ case 1:
+ return FontFamily.FF_DONTCARE;
+ // Latin Text
+ case 2:
+ byte serifStyle = panose[1];
+ return (10 <= serifStyle && serifStyle <= 15)
+ ? FontFamily.FF_SWISS : FontFamily.FF_ROMAN;
+ // Latin Hand Written
+ case 3:
+ return FontFamily.FF_SCRIPT;
+ // Latin Decorative
+ default:
+ case 4:
+ return FontFamily.FF_DECORATIVE;
+ // Latin Symbol
+ case 5:
+ return FontFamily.FF_MODERN;
+ }
+ }
+
+ public String getFamilyName() {
+ return familyName;
+ }
+
+ public String getStyleName() {
+ return styleName;
+ }
+
+ public String getVersionName() {
+ return versionName;
+ }
+
+ public String getFullName() {
+ return fullName;
+ }
+
+ public byte[] getPanose() {
+ return panose;
+ }
+
+ @Override
+ public String getTypeface() {
+ return getFamilyName();
+ }
+
+ public int getFlags() {
+ return flags;
+ }
+}
+
+
+
diff --git a/src/java/org/apache/poi/common/usermodel/fonts/FontInfo.java b/src/java/org/apache/poi/common/usermodel/fonts/FontInfo.java
index ecb5a69687..b47b02e53b 100644
--- a/src/java/org/apache/poi/common/usermodel/fonts/FontInfo.java
+++ b/src/java/org/apache/poi/common/usermodel/fonts/FontInfo.java
@@ -17,6 +17,11 @@ limitations under the License.
package org.apache.poi.common.usermodel.fonts;
+import java.util.Collections;
+import java.util.List;
+
+import org.apache.poi.util.Beta;
+
/**
* A FontInfo object holds information about a font configuration.
* It is roughly an equivalent to the LOGFONT structure in Windows GDI.<p>
@@ -30,6 +35,7 @@ package org.apache.poi.common.usermodel.fonts;
*
* @see <a href="https://msdn.microsoft.com/en-us/library/dd145037.aspx">LOGFONT structure</a>
*/
+@SuppressWarnings("unused")
public interface FontInfo {
/**
@@ -37,7 +43,9 @@ public interface FontInfo {
* @return unique index number of the underlying record this Font represents
* (probably you don't care unless you're comparing which one is which)
*/
- Integer getIndex();
+ default Integer getIndex() {
+ return null;
+ }
/**
* Sets the index within the collection of Font objects
@@ -46,7 +54,9 @@ public interface FontInfo {
*
* @throws UnsupportedOperationException if unsupported
*/
- void setIndex(int index);
+ default void setIndex(int index) {
+ throw new UnsupportedOperationException("FontInfo is read-only.");
+ }
/**
@@ -60,36 +70,48 @@ public interface FontInfo {
* @param typeface the full name of the font, when {@code null} removes the font definition -
* removal is implementation specific
*/
- void setTypeface(String typeface);
+ default void setTypeface(String typeface) {
+ throw new UnsupportedOperationException("FontInfo is read-only.");
+ }
/**
* @return the font charset
*/
- FontCharset getCharset();
+ default FontCharset getCharset() {
+ return FontCharset.ANSI;
+ }
/**
* Sets the charset
*
* @param charset the charset
*/
- void setCharset(FontCharset charset);
+ default void setCharset(FontCharset charset) {
+ throw new UnsupportedOperationException("FontInfo is read-only.");
+ }
/**
* @return the family class
*/
- FontFamily getFamily();
+ default FontFamily getFamily() {
+ return FontFamily.FF_DONTCARE;
+ }
/**
* Sets the font family class
*
* @param family the font family class
*/
- void setFamily(FontFamily family);
+ default void setFamily(FontFamily family) {
+ throw new UnsupportedOperationException("FontInfo is read-only.");
+ }
/**
* @return the font pitch or {@code null} if unsupported
*/
- FontPitch getPitch();
+ default FontPitch getPitch() {
+ return null;
+ }
/**
* Set the font pitch
@@ -98,5 +120,33 @@ public interface FontInfo {
*
* @throws UnsupportedOperationException if unsupported
*/
- void setPitch(FontPitch pitch);
+ default void setPitch(FontPitch pitch) {
+ throw new UnsupportedOperationException("FontInfo is read-only.");
+ }
+
+ /**
+ * @return panose info in binary form or {@code null} if unknown
+ */
+ default byte[] getPanose() {
+ return null;
+ }
+
+ /**
+ * Set the panose in binary form
+ * @param panose the panose bytes
+ */
+ default void setPanose(byte[] panose) {
+ throw new UnsupportedOperationException("FontInfo is read-only.");
+ }
+
+
+ /**
+ * If font facets are embedded in the document, return the list of embedded facets.
+ * The font embedding is experimental, therefore the API can change.
+ * @return the list of embedded EOT font data
+ */
+ @Beta
+ default List<? extends FontFacet> getFacets() {
+ return Collections.emptyList();
+ }
} \ No newline at end of file
diff --git a/src/java/org/apache/poi/sl/draw/DrawFontInfo.java b/src/java/org/apache/poi/sl/draw/DrawFontInfo.java
index dc7afb4e24..da1979cb9e 100644
--- a/src/java/org/apache/poi/sl/draw/DrawFontInfo.java
+++ b/src/java/org/apache/poi/sl/draw/DrawFontInfo.java
@@ -19,10 +19,7 @@
package org.apache.poi.sl.draw;
-import org.apache.poi.common.usermodel.fonts.FontCharset;
-import org.apache.poi.common.usermodel.fonts.FontFamily;
import org.apache.poi.common.usermodel.fonts.FontInfo;
-import org.apache.poi.common.usermodel.fonts.FontPitch;
import org.apache.poi.util.Internal;
/**
@@ -38,52 +35,7 @@ import org.apache.poi.util.Internal;
}
@Override
- public Integer getIndex() {
- return null;
- }
-
- @Override
- public void setIndex(int index) {
- throw new UnsupportedOperationException("DrawFontManagers FontInfo can't be changed.");
- }
-
- @Override
public String getTypeface() {
return typeface;
}
-
- @Override
- public void setTypeface(String typeface) {
- throw new UnsupportedOperationException("DrawFontManagers FontInfo can't be changed.");
- }
-
- @Override
- public FontCharset getCharset() {
- return FontCharset.ANSI;
- }
-
- @Override
- public void setCharset(FontCharset charset) {
- throw new UnsupportedOperationException("DrawFontManagers FontInfo can't be changed.");
- }
-
- @Override
- public FontFamily getFamily() {
- return FontFamily.FF_SWISS;
- }
-
- @Override
- public void setFamily(FontFamily family) {
- throw new UnsupportedOperationException("DrawFontManagers FontInfo can't be changed.");
- }
-
- @Override
- public FontPitch getPitch() {
- return FontPitch.VARIABLE;
- }
-
- @Override
- public void setPitch(FontPitch pitch) {
- throw new UnsupportedOperationException("DrawFontManagers FontInfo can't be changed.");
- }
}
diff --git a/src/java/org/apache/poi/sl/extractor/SlideShowExtractor.java b/src/java/org/apache/poi/sl/extractor/SlideShowExtractor.java
index dee4d44a03..7173c24e97 100644
--- a/src/java/org/apache/poi/sl/extractor/SlideShowExtractor.java
+++ b/src/java/org/apache/poi/sl/extractor/SlideShowExtractor.java
@@ -18,10 +18,14 @@
package org.apache.poi.sl.extractor;
import java.util.ArrayList;
+import java.util.BitSet;
+import java.util.LinkedList;
import java.util.List;
+import java.util.function.Consumer;
+import java.util.function.Function;
+import java.util.function.Predicate;
import org.apache.poi.extractor.POITextExtractor;
-import org.apache.poi.sl.usermodel.Comment;
import org.apache.poi.sl.usermodel.MasterSheet;
import org.apache.poi.sl.usermodel.Notes;
import org.apache.poi.sl.usermodel.ObjectShape;
@@ -52,6 +56,10 @@ public class SlideShowExtractor<
> extends POITextExtractor {
private static final POILogger LOG = POILogFactory.getLogger(SlideShowExtractor.class);
+ // placeholder text for slide numbers
+ private static final String SLIDE_NUMBER_PH = "‹#›";
+
+
private SlideShow<S,P> slideshow;
private boolean slidesByDefault = true;
@@ -59,7 +67,8 @@ public class SlideShowExtractor<
private boolean commentsByDefault;
private boolean masterByDefault;
-
+ private Predicate<Object> filter = o -> true;
+
public SlideShowExtractor(final SlideShow<S,P> slideshow) {
setFilesystem(slideshow);
this.slideshow = slideshow;
@@ -115,9 +124,8 @@ public class SlideShowExtractor<
@Override
public String getText() {
final StringBuilder sb = new StringBuilder();
-
for (final Slide<S, P> slide : slideshow.getSlides()) {
- sb.append(getText(slide));
+ getText(slide, sb::append);
}
return sb.toString();
@@ -125,34 +133,37 @@ public class SlideShowExtractor<
public String getText(final Slide<S,P> slide) {
final StringBuilder sb = new StringBuilder();
+ getText(slide, sb::append);
+ return sb.toString();
+ }
+
+ private void getText(final Slide<S,P> slide, final Consumer<String> consumer) {
if (slidesByDefault) {
- printShapeText(slide, sb);
+ printShapeText(slide, consumer);
}
if (masterByDefault) {
final MasterSheet<S,P> ms = slide.getMasterSheet();
- printSlideMaster(ms, sb);
+ printSlideMaster(ms, consumer);
// only print slide layout, if it's a different instance
final MasterSheet<S,P> sl = slide.getSlideLayout();
if (sl != ms) {
- printSlideMaster(sl, sb);
+ printSlideMaster(sl, consumer);
}
}
if (commentsByDefault) {
- printComments(slide, sb);
+ printComments(slide, consumer);
}
if (notesByDefault) {
- printNotes(slide, sb);
+ printNotes(slide, consumer);
}
-
- return sb.toString();
}
- private void printSlideMaster(final MasterSheet<S,P> master, final StringBuilder sb) {
+ private void printSlideMaster(final MasterSheet<S,P> master, final Consumer<String> consumer) {
if (master == null) {
return;
}
@@ -163,163 +174,140 @@ public class SlideShowExtractor<
if (text == null || text.isEmpty() || "*".equals(text)) {
continue;
}
+
if (ts.isPlaceholder()) {
// don't bother about boiler plate text on master sheets
LOG.log(POILogger.INFO, "Ignoring boiler plate (placeholder) text on slide master:", text);
continue;
}
- sb.append(text);
- if (!text.endsWith("\n")) {
- sb.append("\n");
- }
+ printTextParagraphs(ts.getTextParagraphs(), consumer);
}
}
}
- private String printHeaderReturnFooter(final Sheet<S,P> sheet, final StringBuilder sb) {
- final Sheet<S, P> m = (sheet instanceof Slide) ? sheet.getMasterSheet() : sheet;
- final StringBuilder footer = new StringBuilder("\n");
- addSheetPlaceholderDatails(sheet, Placeholder.HEADER, sb);
- addSheetPlaceholderDatails(sheet, Placeholder.FOOTER, footer);
+ private void printTextParagraphs(final List<P> paras, final Consumer<String> consumer) {
+ printTextParagraphs(paras, consumer, "\n");
+ }
- if (masterByDefault) {
- // write header texts and determine footer text
- for (Shape<S, P> s : m) {
- if (!(s instanceof TextShape)) {
- continue;
- }
- final TextShape<S, P> ts = (TextShape<S, P>) s;
- final PlaceholderDetails pd = ts.getPlaceholderDetails();
- if (pd == null || !pd.isVisible() || pd.getPlaceholder() == null) {
- continue;
- }
- switch (pd.getPlaceholder()) {
- case HEADER:
- sb.append(ts.getText());
- sb.append('\n');
- break;
- case SLIDE_NUMBER:
- if (sheet instanceof Slide) {
- footer.append(ts.getText().replace("‹#›", Integer.toString(((Slide<S, P>) sheet).getSlideNumber() + 1)));
- footer.append('\n');
- }
- break;
- case FOOTER:
- footer.append(ts.getText());
- footer.append('\n');
- break;
- case DATETIME:
- // currently not supported
- default:
- break;
+
+ private void printTextParagraphs(final List<P> paras, final Consumer<String> consumer, String trailer) {
+ printTextParagraphs(paras, consumer, trailer, SlideShowExtractor::replaceTextCap);
+ }
+
+ private void printTextParagraphs(final List<P> paras, final Consumer<String> consumer, String trailer, final Function<TextRun,String> converter) {
+ for (P p : paras) {
+ for (TextRun r : p) {
+ if (filter.test(r)) {
+ consumer.accept(converter.apply(r));
}
}
+ if (!trailer.isEmpty() && filter.test(trailer)) {
+ consumer.accept(trailer);
+ }
}
-
- return (footer.length() > 1) ? footer.toString() : "";
}
- private void addSheetPlaceholderDatails(final Sheet<S,P> sheet, final Placeholder placeholder, final StringBuilder sb) {
- final PlaceholderDetails headerPD = sheet.getPlaceholderDetails(placeholder);
- if (headerPD == null) {
+ private void printHeaderFooter(final Sheet<S,P> sheet, final Consumer<String> consumer, final Consumer<String> footerCon) {
+ final Sheet<S, P> m = (sheet instanceof Slide) ? sheet.getMasterSheet() : sheet;
+ addSheetPlaceholderDatails(sheet, Placeholder.HEADER, consumer);
+ addSheetPlaceholderDatails(sheet, Placeholder.FOOTER, footerCon);
+
+ if (!masterByDefault) {
return;
}
- final String headerStr = headerPD.getText();
- if (headerStr == null) {
- return;
+
+ // write header texts and determine footer text
+ for (Shape<S, P> s : m) {
+ if (!(s instanceof TextShape)) {
+ continue;
+ }
+ final TextShape<S, P> ts = (TextShape<S, P>) s;
+ final PlaceholderDetails pd = ts.getPlaceholderDetails();
+ if (pd == null || !pd.isVisible() || pd.getPlaceholder() == null) {
+ continue;
+ }
+ switch (pd.getPlaceholder()) {
+ case HEADER:
+ printTextParagraphs(ts.getTextParagraphs(), consumer);
+ break;
+ case FOOTER:
+ printTextParagraphs(ts.getTextParagraphs(), footerCon);
+ break;
+ case SLIDE_NUMBER:
+ printTextParagraphs(ts.getTextParagraphs(), footerCon, "\n", SlideShowExtractor::replaceSlideNumber);
+ break;
+ case DATETIME:
+ // currently not supported
+ default:
+ break;
+ }
}
- sb.append(headerStr);
}
- private void printShapeText(final Sheet<S,P> sheet, final StringBuilder sb) {
- final String footer = printHeaderReturnFooter(sheet, sb);
- printShapeText((ShapeContainer<S,P>)sheet, sb);
- sb.append(footer);
+
+ private void addSheetPlaceholderDatails(final Sheet<S,P> sheet, final Placeholder placeholder, final Consumer<String> consumer) {
+ final PlaceholderDetails headerPD = sheet.getPlaceholderDetails(placeholder);
+ final String headerStr = (headerPD != null) ? headerPD.getText() : null;
+ if (headerStr != null && filter.test(headerPD)) {
+ consumer.accept(headerStr);
+ }
+ }
+
+ private void printShapeText(final Sheet<S,P> sheet, final Consumer<String> consumer) {
+ final List<String> footer = new LinkedList<>();
+ printHeaderFooter(sheet, consumer, footer::add);
+ printShapeText((ShapeContainer<S,P>)sheet, consumer);
+ footer.forEach(consumer);
}
@SuppressWarnings("unchecked")
- private void printShapeText(final ShapeContainer<S,P> container, final StringBuilder sb) {
+ private void printShapeText(final ShapeContainer<S,P> container, final Consumer<String> consumer) {
for (Shape<S,P> shape : container) {
if (shape instanceof TextShape) {
- printShapeText((TextShape<S,P>)shape, sb);
+ printTextParagraphs(((TextShape<S,P>)shape).getTextParagraphs(), consumer);
} else if (shape instanceof TableShape) {
- printShapeText((TableShape<S,P>)shape, sb);
+ printShapeText((TableShape<S,P>)shape, consumer);
} else if (shape instanceof ShapeContainer) {
- printShapeText((ShapeContainer<S,P>)shape, sb);
+ printShapeText((ShapeContainer<S,P>)shape, consumer);
}
}
}
- private void printShapeText(final TextShape<S,P> shape, final StringBuilder sb) {
- final List<P> paraList = shape.getTextParagraphs();
- if (paraList.isEmpty()) {
- sb.append('\n');
- return;
- }
- for (final P para : paraList) {
- for (final TextRun tr : para) {
- final String str = tr.getRawText().replace("\r", "");
- final String newStr;
- switch (tr.getTextCap()) {
- case ALL:
- newStr = str.toUpperCase(LocaleUtil.getUserLocale());
- break;
- case SMALL:
- newStr = str.toLowerCase(LocaleUtil.getUserLocale());
- break;
- default:
- case NONE:
- newStr = str;
- break;
- }
- sb.append(newStr);
- }
- sb.append('\n');
- }
- }
-
@SuppressWarnings("Duplicates")
- private void printShapeText(final TableShape<S,P> shape, final StringBuilder sb) {
+ private void printShapeText(final TableShape<S,P> shape, final Consumer<String> consumer) {
final int nrows = shape.getNumberOfRows();
final int ncols = shape.getNumberOfColumns();
- for (int row = 0; row < nrows; row++){
+ for (int row = 0; row < nrows; row++) {
+ String trailer = "";
for (int col = 0; col < ncols; col++){
TableCell<S, P> cell = shape.getCell(row, col);
//defensive null checks; don't know if they're necessary
- if (cell != null){
- String txt = cell.getText();
- txt = (txt == null) ? "" : txt;
- sb.append(txt);
- if (col < ncols-1){
- sb.append('\t');
- }
+ if (cell != null) {
+ trailer = col < ncols-1 ? "\t" : "\n";
+ printTextParagraphs(cell.getTextParagraphs(), consumer, trailer);
}
}
- sb.append('\n');
+ if (!trailer.equals("\n") && filter.test("\n")) {
+ consumer.accept("\n");
+ }
}
}
- private void printComments(final Slide<S,P> slide, final StringBuilder sb) {
- for (final Comment comment : slide.getComments()) {
- sb.append(comment.getAuthor());
- sb.append(" - ");
- sb.append(comment.getText());
- sb.append("\n");
- }
+ private void printComments(final Slide<S,P> slide, final Consumer<String> consumer) {
+ slide.getComments().stream().filter(filter).map(c -> c.getAuthor()+" - "+c.getText()).forEach(consumer);
}
- private void printNotes(final Slide<S,P> slide, final StringBuilder sb) {
+ private void printNotes(final Slide<S,P> slide, final Consumer<String> consumer) {
final Notes<S, P> notes = slide.getNotes();
if (notes == null) {
return;
}
- final String footer = printHeaderReturnFooter(notes, sb);
-
- printShapeText(notes, sb);
-
- sb.append(footer);
+ List<String> footer = new LinkedList<>();
+ printHeaderFooter(notes, consumer, footer::add);
+ printShapeText(notes, consumer);
+ footer.forEach(consumer);
}
public List<? extends ObjectShape<S,P>> getOLEShapes() {
@@ -342,4 +330,83 @@ public class SlideShowExtractor<
}
}
}
+
+ private static String replaceSlideNumber(TextRun tr) {
+ String raw = tr.getRawText();
+
+ if (!raw.contains(SLIDE_NUMBER_PH)) {
+ return raw;
+ }
+
+ TextParagraph tp = tr.getParagraph();
+ TextShape ps = (tp != null) ? tp.getParentShape() : null;
+ Sheet sh = (ps != null) ? ps.getSheet() : null;
+ String slideNr = (sh instanceof Slide) ? Integer.toString(((Slide)sh).getSlideNumber() + 1) : "";
+
+ return raw.replace(SLIDE_NUMBER_PH, slideNr);
+ }
+
+ private static String replaceTextCap(TextRun tr) {
+ final TextParagraph tp = tr.getParagraph();
+ final TextShape sh = (tp != null) ? tp.getParentShape() : null;
+ final Placeholder ph = (sh != null) ? sh.getPlaceholder() : null;
+
+ // 0xB acts like cariage return in page titles and like blank in the others
+ final char sep = (
+ ph == Placeholder.TITLE ||
+ ph == Placeholder.CENTERED_TITLE ||
+ ph == Placeholder.SUBTITLE
+ ) ? '\n' : ' ';
+
+ // PowerPoint seems to store files with \r as the line break
+ // The messes things up on everything but a Mac, so translate them to \n
+ String txt = tr.getRawText();
+ txt = txt.replace('\r', '\n');
+ txt = txt.replace((char) 0x0B, sep);
+
+ switch (tr.getTextCap()) {
+ case ALL:
+ txt = txt.toUpperCase(LocaleUtil.getUserLocale());
+ case SMALL:
+ txt = txt.toLowerCase(LocaleUtil.getUserLocale());
+ }
+
+ return txt;
+ }
+
+ /**
+ * Extract the used codepoints for font embedding / subsetting
+ * @param typeface the typeface/font family of the textruns to examine
+ * @param italic use {@code true} for italic TextRuns, {@code false} for non-italic ones and
+ * {@code null} if it doesn't matter
+ * @param bold use {@code true} for bold TextRuns, {@code false} for non-bold ones and
+ * {@code null} if it doesn't matter
+ * @return a bitset with the marked/used codepoints
+ */
+ public BitSet getCodepoints(String typeface, Boolean italic, Boolean bold) {
+ final BitSet glyphs = new BitSet();
+
+ Predicate<Object> filterOld = filter;
+ try {
+ filter = o -> filterFonts(o, typeface, italic, bold);
+ slideshow.getSlides().forEach(slide ->
+ getText(slide, s -> s.codePoints().forEach(glyphs::set))
+ );
+ } finally {
+ filter = filterOld;
+ }
+
+ return glyphs;
+ }
+
+ private static boolean filterFonts(Object o, String typeface, Boolean italic, Boolean bold) {
+ if (!(o instanceof TextRun)) {
+ return false;
+ }
+ TextRun tr = (TextRun)o;
+ return
+ typeface.equalsIgnoreCase(tr.getFontFamily()) &&
+ (italic == null || tr.isItalic() == italic) &&
+ (bold == null || tr.isBold() == bold);
+ }
}
diff --git a/src/java/org/apache/poi/sl/usermodel/FontCollection.java b/src/java/org/apache/poi/sl/usermodel/FontCollection.java
deleted file mode 100644
index 61278f4618..0000000000
--- a/src/java/org/apache/poi/sl/usermodel/FontCollection.java
+++ /dev/null
@@ -1,22 +0,0 @@
-/* ====================================================================
- Licensed to the Apache Software Foundation (ASF) under one or more
- contributor license agreements. See the NOTICE file distributed with
- this work for additional information regarding copyright ownership.
- The ASF licenses this file to You under the Apache License, Version 2.0
- (the "License"); you may not use this file except in compliance with
- the License. You may obtain a copy of the License at
-
- http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
-==================================================================== */
-
-package org.apache.poi.sl.usermodel;
-
-public interface FontCollection {
-
-}
diff --git a/src/java/org/apache/poi/sl/usermodel/Resources.java b/src/java/org/apache/poi/sl/usermodel/Resources.java
deleted file mode 100644
index 96170e50bd..0000000000
--- a/src/java/org/apache/poi/sl/usermodel/Resources.java
+++ /dev/null
@@ -1,29 +0,0 @@
-/* ====================================================================
- Licensed to the Apache Software Foundation (ASF) under one or more
- contributor license agreements. See the NOTICE file distributed with
- this work for additional information regarding copyright ownership.
- The ASF licenses this file to You under the Apache License, Version 2.0
- (the "License"); you may not use this file except in compliance with
- the License. You may obtain a copy of the License at
-
- http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
-==================================================================== */
-
-package org.apache.poi.sl.usermodel;
-
-/**
- * Common SlideShow resources, such as fonts, pictures
- * and multimedia data
- */
-public interface Resources {
- public FontCollection getFontCollection();
-
- public PictureData[] getPictureData();
- public int addPictureData(PictureData pict);
-}
diff --git a/src/java/org/apache/poi/sl/usermodel/Slide.java b/src/java/org/apache/poi/sl/usermodel/Slide.java
index 91b80f107e..7c0d566138 100644
--- a/src/java/org/apache/poi/sl/usermodel/Slide.java
+++ b/src/java/org/apache/poi/sl/usermodel/Slide.java
@@ -19,6 +19,7 @@ package org.apache.poi.sl.usermodel;
import java.util.List;
+@SuppressWarnings("unused")
public interface Slide<
S extends Shape<S,P>,
P extends TextParagraph<S,P,? extends TextRun>
@@ -82,7 +83,7 @@ public interface Slide<
*
* @since POI 4.0.0
*/
- MasterSheet getSlideLayout();
+ MasterSheet<S,P> getSlideLayout();
/**
* @return the slide name, defaults to "Slide[slideNumber]"
diff --git a/src/java/org/apache/poi/sl/usermodel/SlideShow.java b/src/java/org/apache/poi/sl/usermodel/SlideShow.java
index 175ad2b00e..751379de92 100644
--- a/src/java/org/apache/poi/sl/usermodel/SlideShow.java
+++ b/src/java/org/apache/poi/sl/usermodel/SlideShow.java
@@ -25,6 +25,7 @@ import java.io.InputStream;
import java.io.OutputStream;
import java.util.List;
+import org.apache.poi.common.usermodel.fonts.FontInfo;
import org.apache.poi.extractor.POITextExtractor;
import org.apache.poi.sl.usermodel.PictureData.PictureType;
@@ -44,8 +45,6 @@ public interface SlideShow<
*/
List<? extends MasterSheet<S,P>> getSlideMasters();
- Resources getResources();
-
/**
* Returns the current page size
*
@@ -135,4 +134,30 @@ public interface SlideShow<
* @since POI 4.0.0
*/
Object getPersistDocument();
+
+ /**
+ * Add an EOT font to the slideshow.
+ * An EOT or MTX font is a transformed True-Type (.ttf) or Open-Type (.otf) font.
+ * To transform a True-Type font use the sfntly library (see "see also" below)<p>
+ *
+ * (Older?) Powerpoint versions handle embedded fonts by converting them to .ttf files
+ * and put them into the Windows fonts directory. If the user is not allowed to install
+ * fonts, the slideshow can't be opened. While the slideshow is opened, its possible
+ * to copy the extracted .ttfs from the fonts directory. When the slideshow is closed,
+ * they will be removed.
+ *
+ * @param fontData the EOT font as stream
+ * @return the font info object containing the new font data
+ * @throws IOException if the fontData can't be saved or if the fontData is no EOT font
+ *
+ * @see <a href="http://www.w3.org/Submission/EOT">EOT specification</a>
+ * @see <a href="https://github.com/googlei18n/sfntly">googles sfntly library</a>
+ * @see <a href="https://github.com/kiwiwings/poi-font-mbender">Example on how to subset and embed fonts</a>
+ */
+ FontInfo addFont(InputStream fontData) throws IOException;
+
+ /**
+ * @return a list of registered fonts
+ */
+ List<? extends FontInfo> getFonts();
}
diff --git a/src/java/org/apache/poi/sl/usermodel/TextRun.java b/src/java/org/apache/poi/sl/usermodel/TextRun.java
index 394166071c..7dfd4933d8 100644
--- a/src/java/org/apache/poi/sl/usermodel/TextRun.java
+++ b/src/java/org/apache/poi/sl/usermodel/TextRun.java
@@ -27,6 +27,7 @@ import org.apache.poi.util.Internal;
/**
* Some text.
*/
+@SuppressWarnings("unused")
public interface TextRun {
/**
* Type of text capitals
@@ -243,4 +244,11 @@ public interface TextRun {
*/
@Internal
FieldType getFieldType();
+
+ /**
+ * @return the paragraph which contains this TextRun
+ *
+ * @since POI 4.1.0
+ */
+ TextParagraph<?,?,?> getParagraph();
}