textpiecetable.java

来自「EXCEL read and write」· Java 代码 · 共 273 行

JAVA
273
字号
/* ====================================================================   Licensed to the Apache Software Foundation (ASF) under one or more   contributor license agreements.  See the NOTICE file distributed with   this work for additional information regarding copyright ownership.   The ASF licenses this file to You under the Apache License, Version 2.0   (the "License"); you may not use this file except in compliance with   the License.  You may obtain a copy of the License at       http://www.apache.org/licenses/LICENSE-2.0   Unless required by applicable law or agreed to in writing, software   distributed under the License is distributed on an "AS IS" BASIS,   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.   See the License for the specific language governing permissions and   limitations under the License.==================================================================== */package org.apache.poi.hwpf.model;import org.apache.poi.hwpf.model.io.HWPFOutputStream;import org.apache.poi.poifs.common.POIFSConstants;import java.io.IOException;import java.io.UnsupportedEncodingException;import java.util.ArrayList;import java.util.Arrays;import java.util.Hashtable;import java.util.Iterator;import java.util.List;/** * The piece table for matching up character positions *  to bits of text. * This mostly works in bytes, but the TextPieces *  themselves work in characters. This does the icky *  convertion. * @author Ryan Ackley */public class TextPieceTable{  protected ArrayList _textPieces = new ArrayList();  //int _multiple;  int _cpMin;  public TextPieceTable() {  }  public TextPieceTable(byte[] documentStream, byte[] tableStream, int offset,                        int size, int fcMin)    throws UnsupportedEncodingException  {    // get our plex of PieceDescriptors    PlexOfCps pieceTable = new PlexOfCps(tableStream, offset, size, PieceDescriptor.getSizeInBytes());    int length = pieceTable.length();    PieceDescriptor[] pieces = new PieceDescriptor[length];    // iterate through piece descriptors raw bytes and create    // PieceDescriptor objects    for (int x = 0; x < length; x++)    {      GenericPropertyNode node = pieceTable.getProperty(x);      pieces[x] = new PieceDescriptor(node.getBytes(), 0);    }        // Figure out the cp of the earliest text piece    // Note that text pieces don't have to be stored in order!    _cpMin = pieces[0].getFilePosition() - fcMin;    for (int x = 0; x < pieces.length; x++) {    	int start = pieces[x].getFilePosition() - fcMin;    	if(start < _cpMin) {    		_cpMin = start;    	}    }    // using the PieceDescriptors, build our list of TextPieces.    for (int x = 0; x < pieces.length; x++)    {      int start = pieces[x].getFilePosition();      PropertyNode node = pieceTable.getProperty(x);            // Grab the start and end, which are in characters      int nodeStartChars = node.getStart();      int nodeEndChars = node.getEnd();            // What's the relationship between bytes and characters?      boolean unicode = pieces[x].isUnicode();      int multiple = 1;      if (unicode) {        multiple = 2;      }            // Figure out the length, in bytes and chars      int textSizeChars = (nodeEndChars - nodeStartChars);      int textSizeBytes = textSizeChars * multiple;      // Grab the data that makes up the piece      byte[] buf = new byte[textSizeBytes];      System.arraycopy(documentStream, start, buf, 0, textSizeBytes);      // And now build the piece      _textPieces.add(new TextPiece(nodeStartChars, nodeEndChars, buf, pieces[x], node.getStart()));    }        // In the interest of our sanity, now sort the text pieces    //  into order, if they're not already    TextPiece[] tp = (TextPiece[])    	_textPieces.toArray(new TextPiece[_textPieces.size()]);    Arrays.sort(tp);    for(int i=0; i<tp.length; i++) {    	_textPieces.set(i, tp[i]);    }  }  public int getCpMin()  {    return _cpMin;  }  public List getTextPieces()  {    return _textPieces;  }    /**   * Is the text at the given Character offset   *  unicode, or plain old ascii?   * In a very evil fashion, you have to actually    *  know this to make sense of character and   *  paragraph properties :(   * @param cp The character offset to check about   */  public boolean isUnicodeAtCharOffset(int cp) {	  boolean lastWas = false;	  	  Iterator it = _textPieces.iterator();	  while(it.hasNext()) {		  TextPiece tp = (TextPiece)it.next();		  // If the text piece covers the character, all good		  if(tp.getStart() <= cp && tp.getEnd() >= cp) {			  return tp.isUnicode();		  }		  // Otherwise keep track for the last one		  lastWas = tp.isUnicode();	  }	  	  // If they ask off the end, just go with the last one...	  return lastWas;  }  /**   * Is the text at the given byte offset   *  unicode, or plain old ascii?   * In a very evil fashion, you have to actually    *  know this to make sense of character and   *  paragraph properties :(   * @param cp The character offset to check about   */  public boolean isUnicodeAtByteOffset(int bytePos) {	  boolean lastWas = false;	  int curByte = 0;	  	  Iterator it = _textPieces.iterator();	  while(it.hasNext()) {		  TextPiece tp = (TextPiece)it.next();		  int nextByte = curByte + tp.bytesLength();		  		  // If the text piece covers the character, all good		  if(curByte <= bytePos && nextByte >= bytePos) {			  return tp.isUnicode();		  }		  // Otherwise keep track for the last one		  lastWas = tp.isUnicode();		  // Move along		  curByte = nextByte;	  }	  	  // If they ask off the end, just go with the last one...	  return lastWas;  }  public byte[] writeTo(HWPFOutputStream docStream)    throws IOException  {    PlexOfCps textPlex = new PlexOfCps(PieceDescriptor.getSizeInBytes());    //int fcMin = docStream.getOffset();    int size = _textPieces.size();    for (int x = 0; x < size; x++)    {      TextPiece next = (TextPiece)_textPieces.get(x);      PieceDescriptor pd = next.getPieceDescriptor();      int offset = docStream.getOffset();      int mod = (offset % POIFSConstants.BIG_BLOCK_SIZE);      if (mod != 0)      {        mod = POIFSConstants.BIG_BLOCK_SIZE - mod;        byte[] buf = new byte[mod];        docStream.write(buf);      }      // set the text piece position to the current docStream offset.      pd.setFilePosition(docStream.getOffset());      // write the text to the docstream and save the piece descriptor to the      // plex which will be written later to the tableStream.      docStream.write(next.getRawBytes());      // The TextPiece is already in characters, which      //  makes our life much easier      int nodeStart = next.getStart();      int nodeEnd = next.getEnd();      textPlex.addProperty(new GenericPropertyNode(nodeStart, nodeEnd,        pd.toByteArray()));    }    return textPlex.toByteArray();  }  /**   * Adjust all the text piece after inserting   *  some text into one of them   * @param listIndex The TextPiece that had characters inserted into   * @param length The number of characters inserted   */  public int adjustForInsert(int listIndex, int length) {    int size = _textPieces.size();    TextPiece tp = (TextPiece)_textPieces.get(listIndex);        // Update with the new end    tp.setEnd(tp.getEnd() + length);        // Now change all subsequent ones    for (int x = listIndex + 1; x < size; x++)    {      tp = (TextPiece)_textPieces.get(x);      tp.setStart(tp.getStart() + length);      tp.setEnd(tp.getEnd() + length);    }        // All done    return length;  }  public boolean equals(Object o)  {    TextPieceTable tpt = (TextPieceTable)o;    int size = tpt._textPieces.size();    if (size == _textPieces.size())    {      for (int x = 0; x < size; x++)      {        if (!tpt._textPieces.get(x).equals(_textPieces.get(x)))        {          return false;        }      }      return true;    }    return false;  }}

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?