hslfslideshow.java
来自「EXCEL read and write」· Java 代码 · 共 569 行 · 第 1/2 页
JAVA
569 行
/* ==================================================================== Licensed to the Apache Software Foundation (ASF) under one or more contributor license agreements. See the NOTICE file distributed with this work for additional information regarding copyright ownership. The ASF licenses this file to You under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License.==================================================================== */package org.apache.poi.hslf;import java.io.ByteArrayInputStream;import java.io.ByteArrayOutputStream;import java.io.FileInputStream;import java.io.FileNotFoundException;import java.io.IOException;import java.io.InputStream;import java.io.OutputStream;import java.util.ArrayList;import java.util.Arrays;import java.util.HashMap;import java.util.Hashtable;import java.util.Iterator;import java.util.List;import org.apache.poi.POIDocument;import org.apache.poi.hslf.exceptions.CorruptPowerPointFileException;import org.apache.poi.hslf.exceptions.EncryptedPowerPointFileException;import org.apache.poi.hslf.exceptions.HSLFException;import org.apache.poi.hslf.record.*;import org.apache.poi.hslf.usermodel.ObjectData;import org.apache.poi.hslf.usermodel.PictureData;import org.apache.poi.poifs.filesystem.DirectoryNode;import org.apache.poi.poifs.filesystem.DocumentEntry;import org.apache.poi.poifs.filesystem.DocumentInputStream;import org.apache.poi.poifs.filesystem.POIFSFileSystem;import org.apache.poi.util.LittleEndian;import org.apache.poi.util.POILogFactory;import org.apache.poi.util.POILogger;/** * This 
class contains the main functionality for the Powerpoint file * "reader". It is only a very basic class for now * * @author Nick Burch */public final class HSLFSlideShow extends POIDocument { // For logging private POILogger logger = POILogFactory.getLogger(this.getClass()); // Holds metadata on where things are in our document private CurrentUserAtom currentUser; // Low level contents of the file private byte[] _docstream; // Low level contents private Record[] _records; // Raw Pictures contained in the pictures stream private PictureData[] _pictures; // Embedded objects stored in storage records in the document stream, lazily populated. private ObjectData[] _objects; /** * Returns the underlying POIFSFileSystem for the document * that is open. */ protected POIFSFileSystem getPOIFSFileSystem() { return filesystem; } /** * Constructs a Powerpoint document from fileName. Parses the document * and places all the important stuff into data structures. * * @param fileName The name of the file to read. * @throws IOException if there is a problem while parsing the document. */ public HSLFSlideShow(String fileName) throws IOException { this(new FileInputStream(fileName)); } /** * Constructs a Powerpoint document from an input stream. Parses the * document and places all the important stuff into data structures. * * @param inputStream the source of the data * @throws IOException if there is a problem while parsing the document. */ public HSLFSlideShow(InputStream inputStream) throws IOException { //do Ole stuff this(new POIFSFileSystem(inputStream)); } /** * Constructs a Powerpoint document from a POIFS Filesystem. Parses the * document and places all the important stuff into data structures. * * @param filesystem the POIFS FileSystem to read from * @throws IOException if there is a problem while parsing the document. 
*/ public HSLFSlideShow(POIFSFileSystem filesystem) throws IOException { this(filesystem.getRoot(), filesystem); } /** * Constructs a Powerpoint document from a specific point in a * POIFS Filesystem. Parses the document and places all the * important stuff into data structures. * * @param dir the POIFS directory to read from * @param filesystem the POIFS FileSystem to read from * @throws IOException if there is a problem while parsing the document. */ public HSLFSlideShow(DirectoryNode dir, POIFSFileSystem filesystem) throws IOException { super(dir, filesystem); // First up, grab the "Current User" stream // We need this before we can detect Encrypted Documents readCurrentUserStream(); // Next up, grab the data that makes up the // PowerPoint stream readPowerPointStream(); // Check to see if we have an encrypted document, // bailing out if we do boolean encrypted = EncryptedSlideShow.checkIfEncrypted(this); if(encrypted) { throw new EncryptedPowerPointFileException("Encrypted PowerPoint files are not supported"); } // Now, build records based on the PowerPoint stream buildRecords(); // Look for Property Streams: readProperties(); // Look for any other streams readOtherStreams(); // Look for Picture Streams: readPictures(); } /** * Constructs a new, empty, Powerpoint document. 
*/
    public static final HSLFSlideShow create() {
        InputStream is = HSLFSlideShow.class.getResourceAsStream("data/empty.ppt");
        if (is == null) {
            throw new RuntimeException("Missing resource 'empty.ppt'");
        }
        try {
            return new HSLFSlideShow(is);
        } catch (IOException e) {
            throw new RuntimeException(e);
        } finally {
            // Release the template resource whether or not parsing worked.
            // A failure to close must not hide the real result or exception.
            try {
                is.close();
            } catch (IOException ignored) {
                // nothing useful can be done about a failed close here
            }
        }
    }

    /**
     * Extracts the main PowerPoint document stream from the
     *  POI file into {@link #_docstream}, ready to be passed
     *  to {@link #buildRecords()}.
     *
     * @throws IOException if the "PowerPoint Document" entry cannot be
     *  found or opened, or if it ends before its declared size was read
     */
    private void readPowerPointStream() throws IOException {
        // Get the main document stream
        DocumentEntry docProps =
            (DocumentEntry)directory.getEntry("PowerPoint Document");

        // Grab the document stream
        _docstream = new byte[docProps.getSize()];
        InputStream in = directory.createDocumentInputStream("PowerPoint Document");
        try {
            // A single read() call is not guaranteed to fill the buffer,
            //  so keep reading until we have every byte
            int filled = 0;
            while (filled < _docstream.length) {
                int n = in.read(_docstream, filled, _docstream.length - filled);
                if (n < 0) {
                    throw new IOException(
                        "PowerPoint Document stream ended after " + filled
                        + " of " + _docstream.length + " bytes");
                }
                filled += n;
            }
        } finally {
            in.close();
        }
    }

    /**
     * Builds the list of records, based on the contents
     *  of the PowerPoint stream. Reading starts from the edit offset
     *  reported by the Current User atom and the result is stored
     *  in {@link #_records}.
     */
    private void buildRecords() {
        // The format of records in a powerpoint file are:
        //   <little endian 2 byte "info">
        //   <little endian 2 byte "type">
        //   <little endian 4 byte "length">
        // If it has a zero length, following it will be another record
        //      <xx xx yy yy 00 00 00 00> <xx xx yy yy zz zz zz zz>
        // If it has a length, depending on its type it may have children or data
        // If it has children, these will follow straight away
        //      <xx xx yy yy zz zz zz zz <xx xx yy yy zz zz zz zz>>
        // If it has data, this will come straight after, and run for the length
        //      <xx xx yy yy zz zz zz zz dd dd dd dd dd dd dd>
        // All lengths given exclude the 8 byte record header
        // (Data records are known as Atoms)

        // Document should start with:
        //   0F 00 E8 03 ## ## ## ##
        //     (type 1000 = document, info 00 0f is normal, rest is document length)
        //   01 00 E9 03 28 00 00 00
        //     (type 1001 = document atom, info 00 01 normal, 28 bytes long)
        //   80 16 00 00 E0 10 00 00 xx xx xx xx xx xx xx xx
        //   05 00 00 00 0A 00 00 00 xx xx xx
        //     (the contents of the document atom, not sure what it means yet)
        //   (records then follow)

        // When parsing a document, look to see if you know about that type
        //  of the current record. If you know it's a type that has children,
        //  process the record's data area looking for more records
        // If you know about the type and it doesn't have children, either do
        //  something with the data (eg TextRun) or skip over it
        // If you don't know about the type, play safe and skip over it (using
        //  its length to know where the next record will start)
        //
        _records = read(_docstream, (int)currentUser.getCurrentEditOffset());
    }

    /**
     * Builds the records reachable from a chain of user edits.
     * <p>
     * Starting at <code>usrOffset</code>, each UserEditAtom is read together
     * with the PersistPtrHolder it points to; the offsets of both, plus every
     * offset listed in the holder's slide locations lookup, are collected.
     * The chain is followed through the "last user edit" offset until that
     * offset is 0. The collected offsets are then sorted and a record is
     * built at each one; records that are {@link PersistRecord}s are given
     * the persist id their offset was listed under.
     *
     * @param docstream the raw bytes of the PowerPoint document stream
     * @param usrOffset offset of the most recent UserEditAtom, or 0 for none
     * @return the records found, ordered by their offset in the stream
     * @throws CorruptPowerPointFileException if the chain of user edits
     *  loops back onto an offset that was already visited
     */
    private Record[] read(byte[] docstream, int usrOffset){
        ArrayList lst = new ArrayList();
        HashMap offset2id = new HashMap();
        // Offsets of the UserEditAtoms walked so far, to detect a cyclic chain
        ArrayList seenEdits = new ArrayList();

        while (usrOffset != 0){
            Integer usrKey = new Integer(usrOffset);
            if (seenEdits.contains(usrKey)) {
                // Without this check a corrupt back-pointer would loop forever
                throw new CorruptPowerPointFileException(
                    "The chain of UserEditAtoms loops back to offset " + usrOffset);
            }
            seenEdits.add(usrKey);

            UserEditAtom usr = (UserEditAtom) Record.buildRecordAtOffset(docstream, usrOffset);
            lst.add(usrKey);
            int psrOffset = usr.getPersistPointersOffset();

            PersistPtrHolder ptr = (PersistPtrHolder)Record.buildRecordAtOffset(docstream, psrOffset);
            lst.add(new Integer(psrOffset));

            // Remember, for each listed offset, the persist id it belongs to
            Hashtable entries = ptr.getSlideLocationsLookup();
            for (Iterator it = entries.keySet().iterator(); it.hasNext(); ) {
                Integer id = (Integer)it.next();
                Integer offset = (Integer)entries.get(id);

                lst.add(offset);
                offset2id.put(offset, id);
            }

            // Step back to the previous edit, if there was one
            usrOffset = usr.getLastUserEditAtomOffset();
        }

        //sort found records by offset.
        //(it is not necessary but SlideShow.findMostRecentCoreRecords() expects them sorted)
        Object a[] = lst.toArray();
        Arrays.sort(a);

        Record[] rec = new Record[lst.size()];
        for (int i = 0; i < a.length; i++) {
            Integer offset = (Integer)a[i];
            rec[i] = Record.buildRecordAtOffset(docstream, offset.intValue());
            if (rec[i] instanceof PersistRecord) {
                PersistRecord psr = (PersistRecord)rec[i];
                Integer id = (Integer)offset2id.get(offset);
                psr.setPersistId(id.intValue());
            }
        }

        return rec;
    }

    /**
     * Find the "Current User" stream, and load it.
     * If it cannot be read, the problem is logged and a default
     *  CurrentUserAtom is used instead, so that loading can carry on.
     */
    private void readCurrentUserStream() {
        try {
            currentUser = new CurrentUserAtom(directory);
        } catch(IOException ie) {
            logger.log(POILogger.ERROR, "Error finding Current User Atom:\n" + ie);
            currentUser = new CurrentUserAtom();
        }
    }

    /**
     * Find any other streams from the filesystem, and load them
     */
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?