123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330 |
-
- /* ====================================================================
- Licensed to the Apache Software Foundation (ASF) under one or more
- contributor license agreements. See the NOTICE file distributed with
- this work for additional information regarding copyright ownership.
- The ASF licenses this file to You under the Apache License, Version 2.0
- (the "License"); you may not use this file except in compliance with
- the License. You may obtain a copy of the License at
-
- http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
- ==================================================================== */
-
-
- package org.apache.poi.poifs.eventfilesystem;
-
- import java.io.*;
-
- import java.util.*;
-
- import org.apache.poi.poifs.filesystem.DocumentInputStream;
- import org.apache.poi.poifs.filesystem.POIFSDocument;
- import org.apache.poi.poifs.filesystem.POIFSDocumentPath;
- import org.apache.poi.poifs.property.DirectoryProperty;
- import org.apache.poi.poifs.property.Property;
- import org.apache.poi.poifs.property.PropertyTable;
- import org.apache.poi.poifs.storage.BlockAllocationTableReader;
- import org.apache.poi.poifs.storage.BlockList;
- import org.apache.poi.poifs.storage.HeaderBlock;
- import org.apache.poi.poifs.storage.RawDataBlockList;
- import org.apache.poi.poifs.storage.SmallBlockTableReader;
-
- /**
- * An event-driven reader for POIFS file systems. Users of this class
- * first create an instance of it, then use the registerListener
- * methods to register POIFSReaderListener instances for specific
- * documents. Once all the listeners have been registered, the read()
- * method is called, which results in the listeners being notified as
- * their documents are read.
- *
- * @author Marc Johnson (mjohnson at apache dot org)
- */
-
- public class POIFSReader
- {
- private POIFSReaderRegistry registry;
- private boolean registryClosed;
-
- /**
- * Create a POIFSReader
- */
-
- public POIFSReader()
- {
- registry = new POIFSReaderRegistry();
- registryClosed = false;
- }
-
- /**
- * Read from an InputStream and process the documents we get
- *
- * @param stream the InputStream from which to read the data
- *
- * @exception IOException on errors reading, or on invalid data
- */
-
- public void read(final InputStream stream)
- throws IOException
- {
- registryClosed = true;
-
- // read the header block from the stream
- HeaderBlock header_block = new HeaderBlock(stream);
-
- // read the rest of the stream into blocks
- RawDataBlockList data_blocks = new RawDataBlockList(stream, header_block.getBigBlockSize());
-
- // set up the block allocation table (necessary for the
- // data_blocks to be manageable
- new BlockAllocationTableReader(header_block.getBigBlockSize(),
- header_block.getBATCount(),
- header_block.getBATArray(),
- header_block.getXBATCount(),
- header_block.getXBATIndex(),
- data_blocks);
-
- // get property table from the document
- PropertyTable properties =
- new PropertyTable(header_block, data_blocks);
-
- // process documents
- processProperties(SmallBlockTableReader
- .getSmallDocumentBlocks(
- header_block.getBigBlockSize(),
- data_blocks, properties.getRoot(),
- header_block.getSBATStart()),
- data_blocks, properties.getRoot()
- .getChildren(), new POIFSDocumentPath());
- }
-
- /**
- * Register a POIFSReaderListener for all documents
- *
- * @param listener the listener to be registered
- *
- * @exception NullPointerException if listener is null
- * @exception IllegalStateException if read() has already been
- * called
- */
-
- public void registerListener(final POIFSReaderListener listener)
- {
- if (listener == null)
- {
- throw new NullPointerException();
- }
- if (registryClosed)
- {
- throw new IllegalStateException();
- }
- registry.registerListener(listener);
- }
-
- /**
- * Register a POIFSReaderListener for a document in the root
- * directory
- *
- * @param listener the listener to be registered
- * @param name the document name
- *
- * @exception NullPointerException if listener is null or name is
- * null or empty
- * @exception IllegalStateException if read() has already been
- * called
- */
-
- public void registerListener(final POIFSReaderListener listener,
- final String name)
- {
- registerListener(listener, null, name);
- }
-
- /**
- * Register a POIFSReaderListener for a document in the specified
- * directory
- *
- * @param listener the listener to be registered
- * @param path the document path; if null, the root directory is
- * assumed
- * @param name the document name
- *
- * @exception NullPointerException if listener is null or name is
- * null or empty
- * @exception IllegalStateException if read() has already been
- * called
- */
-
- public void registerListener(final POIFSReaderListener listener,
- final POIFSDocumentPath path,
- final String name)
- {
- if ((listener == null) || (name == null) || (name.length() == 0))
- {
- throw new NullPointerException();
- }
- if (registryClosed)
- {
- throw new IllegalStateException();
- }
- registry.registerListener(listener,
- (path == null) ? new POIFSDocumentPath()
- : path, name);
- }
-
- /**
- * read in files
- *
- * @param args names of the files
- *
- * @exception IOException
- */
-
- public static void main(String args[])
- throws IOException
- {
- if (args.length == 0)
- {
- System.err
- .println("at least one argument required: input filename(s)");
- System.exit(1);
- }
-
- // register for all
- for (int j = 0; j < args.length; j++)
- {
- POIFSReader reader = new POIFSReader();
- POIFSReaderListener listener = new SampleListener();
-
- reader.registerListener(listener);
- System.out.println("reading " + args[ j ]);
- FileInputStream istream = new FileInputStream(args[ j ]);
-
- reader.read(istream);
- istream.close();
- }
- }
-
- private void processProperties(final BlockList small_blocks,
- final BlockList big_blocks,
- final Iterator properties,
- final POIFSDocumentPath path)
- throws IOException
- {
- while (properties.hasNext())
- {
- Property property = ( Property ) properties.next();
- String name = property.getName();
-
- if (property.isDirectory())
- {
- POIFSDocumentPath new_path = new POIFSDocumentPath(path,
- new String[]
- {
- name
- });
-
- processProperties(
- small_blocks, big_blocks,
- (( DirectoryProperty ) property).getChildren(), new_path);
- }
- else
- {
- int startBlock = property.getStartBlock();
- Iterator listeners = registry.getListeners(path, name);
-
- if (listeners.hasNext())
- {
- int size = property.getSize();
- POIFSDocument document = null;
-
- if (property.shouldUseSmallBlocks())
- {
- document =
- new POIFSDocument(name, small_blocks
- .fetchBlocks(startBlock, -1), size);
- }
- else
- {
- document =
- new POIFSDocument(name, big_blocks
- .fetchBlocks(startBlock, -1), size);
- }
- while (listeners.hasNext())
- {
- POIFSReaderListener listener =
- ( POIFSReaderListener ) listeners.next();
-
- listener.processPOIFSReaderEvent(
- new POIFSReaderEvent(
- new DocumentInputStream(document), path,
- name));
- }
- }
- else
- {
-
- // consume the document's data and discard it
- if (property.shouldUseSmallBlocks())
- {
- small_blocks.fetchBlocks(startBlock, -1);
- }
- else
- {
- big_blocks.fetchBlocks(startBlock, -1);
- }
- }
- }
- }
- }
-
- private static class SampleListener
- implements POIFSReaderListener
- {
-
- /**
- * Constructor SampleListener
- */
-
- SampleListener()
- {
- }
-
- /**
- * Method processPOIFSReaderEvent
- *
- * @param event
- */
-
- public void processPOIFSReaderEvent(final POIFSReaderEvent event)
- {
- DocumentInputStream istream = event.getStream();
- POIFSDocumentPath path = event.getPath();
- String name = event.getName();
-
- try
- {
- byte[] data = new byte[ istream.available() ];
-
- istream.read(data);
- int pathLength = path.length();
-
- for (int k = 0; k < pathLength; k++)
- {
- System.out.print("/" + path.getComponent(k));
- }
- System.out.println("/" + name + ": " + data.length
- + " bytes read");
- }
- catch (IOException ignored)
- {
- }
- }
- } // end private class SampleListener
- } // end public class POIFSReader
|