<changes>
<release version="3.8-beta5" date="2011-??-??">
- <action dev="poi-developers" type="add">51804 - include Master Slide text in XSLF text extraction</action>
+ <action dev="poi-developers" type="add">51804 - optionally include Master Slide text in XSLF text extraction, as HSLF already offers</action>
<action dev="poi-developers" type="add">New PackagePart method getRelatedPart(PackageRelationship) to simplify navigation of relations between OPC Parts</action>
<action dev="poi-developers" type="fix">51832 - handle XLS files where the WRITEPROTECT record precedes the FILEPASS one, rather than following as normal</action>
<action dev="poi-developers" type="fix">51809 - correct GTE handling in COUNTIF</action>
private XMLSlideShow slideshow;
private boolean slidesByDefault = true;
private boolean notesByDefault = false;
+ private boolean masterByDefault = false;
public XSLFPowerPointExtractor(XMLSlideShow slideshow) {
super(slideshow);
this.notesByDefault = notesByDefault;
}
+ /**
+ * Should a call to getText() return text from master? Default is no.
+ * The stored flag is what the two-argument getText(boolean, boolean)
+ * passes on as its masterText choice.
+ * @param masterByDefault true to include master slide text by default
+ */
+ public void setMasterByDefault(boolean masterByDefault) {
+ this.masterByDefault = masterByDefault;
+ }
+
/**
* Gets the slide text, but not the notes text
*/
* @param notesText Should we retrieve text from notes?
*/
public String getText(boolean slideText, boolean notesText) {
+ return getText(slideText, notesText, masterByDefault); // master text follows the configured default
+ }
+
+ /**
+ * Gets the requested text from the file
+ * @param slideText Should we retrieve text from slides?
+ * @param notesText Should we retrieve text from notes?
+ * @param masterText Should we retrieve text from master slides?
+ */
+ public String getText(boolean slideText, boolean notesText, boolean masterText) {
StringBuffer text = new StringBuffer();
XSLFSlide[] slides = slideshow.getSlides();
if (slideText) {
extractText(slide.getCommonSlideData(), text);
- // If there's a master sheet, grab text from there
- if(master != null) {
+ // If there's a master sheet and it's requested, grab text from there
+ if(masterText && master != null) {
extractText(master.getCommonSlideData(), text);
}
"Fifth level\n";
// Just slides, no notes
- text = extractor.getText(true, false);
+ text = extractor.getText(true, false, false);
assertEquals(
"Lorem ipsum dolor sit amet\n" +
"Nunc at risus vel erat tempus posuere. Aenean non ante.\n" +
"\n" +
- masterText +
- "\n\n\n" +
"Lorem ipsum dolor sit amet\n" +
"Lorem\n" +
"ipsum\n" +
"dolor\n" +
"sit\n" +
"amet\n" +
- "\n" +
- masterText +
- "\n\n\n"
+ "\n"
, text
);
);
// Both
- text = extractor.getText(true, true);
+ text = extractor.getText(true, true, false);
assertEquals(
"Lorem ipsum dolor sit amet\n" +
"Nunc at risus vel erat tempus posuere. Aenean non ante.\n" +
- "\n" +
- masterText +
- "\n\n\n\n\n" +
+ "\n\n\n" +
"Lorem ipsum dolor sit amet\n" +
"Lorem\n" +
"ipsum\n" +
"dolor\n" +
"sit\n" +
"amet\n" +
- "\n" +
- masterText +
- "\n\n\n\n\n"
+ "\n\n\n"
, text
);
+ // With Slides and Master Text
+ text = extractor.getText(true, false, true);
+ assertEquals(
+ "Lorem ipsum dolor sit amet\n" +
+ "Nunc at risus vel erat tempus posuere. Aenean non ante.\n" +
+ "\n" +
+ masterText +
+ "\n\n\n" +
+ "Lorem ipsum dolor sit amet\n" +
+ "Lorem\n" +
+ "ipsum\n" +
+ "dolor\n" +
+ "sit\n" +
+ "amet\n" +
+ "\n" +
+ masterText +
+ "\n\n\n"
+ , text
+ );
+
+ // With Slides, Notes and Master Text
+ text = extractor.getText(true, true, true);
+ assertEquals(
+ "Lorem ipsum dolor sit amet\n" +
+ "Nunc at risus vel erat tempus posuere. Aenean non ante.\n" +
+ "\n" +
+ masterText +
+ "\n\n\n\n\n" +
+ "Lorem ipsum dolor sit amet\n" +
+ "Lorem\n" +
+ "ipsum\n" +
+ "dolor\n" +
+ "sit\n" +
+ "amet\n" +
+ "\n" +
+ masterText +
+ "\n\n\n\n\n"
+ , text
+ );
+
// Via set defaults
extractor.setSlidesByDefault(false);
extractor.setNotesByDefault(true);
* @author Nick Burch
*/
public final class PowerPointExtractor extends POIOLE2TextExtractor {
- private HSLFSlideShow _hslfshow;
- private SlideShow _show;
- private Slide[] _slides;
-
- private boolean _slidesByDefault = true;
- private boolean _notesByDefault = false;
- private boolean _commentsByDefault = false;
- private boolean _masterByDefault = false;
+ private HSLFSlideShow _hslfshow;
+ private SlideShow _show;
+ private Slide[] _slides;
+
+ private boolean _slidesByDefault = true;
+ private boolean _notesByDefault = false;
+ private boolean _commentsByDefault = false;
+ private boolean _masterByDefault = false;
/**
* Basic extractor. Returns all the text, and optionally all the notes