/** returns current location pointer and sets to new value */ public void movePointer(final long pointer) { try { // make sure inside file if (pointer > pdf_datafile.length()) { if (LogWriter.isOutput()) { LogWriter.writeLog("Attempting to access ref outside file"); } // throw new PdfException("Exception moving file pointer - ref outside file"); } else { pdf_datafile.seek(pointer); } } catch (final Exception e) { if (LogWriter.isOutput()) { LogWriter.writeLog("Exception " + e + " moving pointer to " + pointer + " in file."); } } }
public Values() { String altSP = System.getProperty("org.jpedal.securityprovider"); try { if (altSP == null) { altSP = "/org/bouncycastle/"; } isEncryptOnClasspath = getClass().getResource(altSP) != null; } catch (final Exception e) { if (LogWriter.isOutput()) { LogWriter.writeLog("Exception in encryption " + e); } isEncryptOnClasspath = false; } catch (final Error e) { if (LogWriter.isOutput()) { LogWriter.writeLog("Exception in encryption " + e); } isEncryptOnClasspath = false; } }
/** update status if client being used also writes to log (called internally as file decoded) */ public final void updateStatus(String progress_bar, int debug_level_to_use) { current = progress_bar; // update status if in client if (showMessages == true) { SwingUtilities.invokeLater( new Runnable() { public void run() { status.setString(current); status.setValue(progress_size); } }); } if (debug_level > debug_level_to_use && LogWriter.isOutput()) LogWriter.writeLog(progress_bar); }
byte[] getBytes(final long start, final int count) { final byte[] buffer = new byte[count]; if (start >= 0) { try { pdf_datafile.seek(start); pdf_datafile.read(buffer); // get next chars } catch (final IOException e) { // tell user and log if (LogWriter.isOutput()) { LogWriter.writeLog("Exception: " + e.getMessage()); } // } } return buffer; }
/** * test first bytes to see if new 1.5 style table with obj or contains ref * * @throws PdfException */ private boolean isCompressedStream(int pointer, final int eof) throws PdfException { final boolean debug = false; int bufSize = 50, charReached_legacy = 0, charReached_comp1 = 0, charReached_comp2 = 0; final int[] objStm = {'O', 'b', 'j', 'S', 't', 'm'}; final int[] XRef = {'X', 'R', 'e', 'f'}; int type = UNSET; // flag to show if at start of data for check boolean firstRead = true; while (true) { /** adjust buffer if less than 1024 bytes left in file */ if (pointer + bufSize > eof) { bufSize = eof - pointer; } if (bufSize < 0) { bufSize = 50; } if (pointer < 0) { pointer += bufSize; continue; } final byte[] buffer = getBytes(pointer, bufSize); // allow for fact sometimes start of data wrong if (firstRead && buffer[0] == 'r' && buffer[1] == 'e' && buffer[2] == 'f') { charReached_legacy = 1; } firstRead = false; // switch off /** look for xref or obj */ for (int i = 0; i < bufSize; i++) { final byte currentByte = buffer[i]; if (debug) { System.out.print((char) currentByte); } /** check for xref OR end - reset if not */ if (currentByte == oldPattern[charReached_legacy] && type != COMPRESSED) { charReached_legacy++; type = LEGACY; } else if ((currentByte == objStm[charReached_comp1]) && (charReached_comp1 == 0 || type == COMPRESSED)) { charReached_comp1++; type = COMPRESSED; } else if ((currentByte == XRef[charReached_comp2]) && (charReached_comp2 == 0 || type == COMPRESSED)) { charReached_comp2++; type = COMPRESSED; } else { charReached_legacy = 0; charReached_comp1 = 0; charReached_comp2 = 0; type = UNSET; } if (charReached_legacy == 3 || charReached_comp1 == 4 || charReached_comp2 == 3) { break; } } if (charReached_legacy == 3 || charReached_comp1 == 4 || charReached_comp2 == 3) { break; } // update pointer pointer += bufSize; } /** throw exception if no match or tell user which type */ if (type == UNSET) { try { closeFile(); } catch (final IOException e1) { if (LogWriter.isOutput()) { LogWriter.writeLog("Exception " + 1 + " closing file " + e1); } } throw new PdfException("Exception unable to find ref or obj in trailer"); } return type == COMPRESSED; }
/** read first start ref from last 1024 bytes */ private int readFirstStartRef() throws PdfException { // reset flag offset.setRefTableInvalid(false); int pointer = -1; int i = 1019; final StringBuilder startRef = new StringBuilder(10); /** move to end of file and read last 1024 bytes */ final int block = 1024; byte[] lastBytes = new byte[block]; long end; /** set endpoint, losing null chars and anything before EOF */ final int[] EndOfFileMarker = {37, 37, 69, 79}; int valReached = 3; boolean EOFFound = false; try { end = eof; /** lose nulls and other trash from end of file */ final int bufSize = 255; while (true) { final byte[] buffer = getBytes(end - bufSize, bufSize); int offset = 0; for (int ii = bufSize - 1; ii > -1; ii--) { // see if we can decrement EOF tracker or restart check if (!EOFFound) { valReached = 3; } if (buffer[ii] == EndOfFileMarker[valReached]) { valReached--; EOFFound = true; } else { EOFFound = false; } // move to next byte offset--; if (valReached < 0) { ii = -1; } } // exit if found values on loop if (valReached < 0) { end -= offset; break; } else { end -= bufSize; } // allow for no eof if (end < 0) { end = eof; break; } } // end=end+bufSize; // allow for very small file int count = (int) (end - block); if (count < 0) { count = 0; final int size = (int) eof; lastBytes = new byte[size]; i = size + 3; // force reset below } lastBytes = getBytes(count, lastBytes.length); } catch (final Exception e) { if (LogWriter.isOutput()) { LogWriter.writeLog("Exception " + e + " reading last 1024 bytes"); } throw new PdfException(e + " reading last 1024 bytes"); } // for(int ii=0;ii<lastBytes.length;ii++){ // System.out.print((char)lastBytes[ii]); // } // System.out.println(); // look for tref as end of startxref final int fileSize = lastBytes.length; if (i > fileSize) { i = fileSize - 5; } while (i > -1) { // first check is because startref works as well a startxref !! if (((lastBytes[i] == 116 && lastBytes[i + 1] == 120) || (lastBytes[i] == 114 && lastBytes[i + 1] == 116)) && (lastBytes[i + 2] == 114) && (lastBytes[i + 3] == 101) && (lastBytes[i + 4] == 102)) { break; } i--; } /** trap buggy files */ if (i == -1) { try { closeFile(); } catch (final IOException e1) { if (LogWriter.isOutput()) { LogWriter.writeLog("Exception " + e1 + " closing file"); } } throw new PdfException("No Startxref found in last 1024 bytes "); } i += 5; // allow for word length // move to start of value ignoring spaces or returns while (i < 1024 && (lastBytes[i] == 10 || lastBytes[i] == 32 || lastBytes[i] == 13)) { i++; } // move to start of value ignoring spaces or returns while ((i < 1024) && (lastBytes[i] != 10) && (lastBytes[i] != 32) && (lastBytes[i] != 13)) { startRef.append((char) lastBytes[i]); i++; } /** convert xref to string to get pointer */ if (startRef.length() > 0) { pointer = Integer.parseInt(startRef.toString()); } if (pointer == -1) { if (LogWriter.isOutput()) { LogWriter.writeLog("No Startref found in last 1024 bytes "); } try { closeFile(); } catch (final IOException e1) { if (LogWriter.isOutput()) { LogWriter.writeLog("Exception " + e1 + " closing file"); } } throw new PdfException("No Startref found in last 1024 bytes "); } return pointer; }
/** read reference table from file so we can locate objects in pdf file and read the trailers */ private PdfObject readLegacyReferenceTable( PdfObject rootObj, int pointer, final int eof, final PdfFileReader currentPdfFile) throws PdfException { int endTable, current = 0; // current object number byte[] Bytes; int bufSize = 1024; /** read and decode 1 or more trailers */ while (true) { try { // allow for pointer outside file Bytes = Trailer.readTrailer(bufSize, pointer, eof, pdf_datafile); } catch (final Exception e) { try { closeFile(); } catch (final IOException e1) { if (LogWriter.isOutput()) { LogWriter.writeLog("Exception " + e + " closing file " + e1); } } throw new PdfException("Exception " + e + " reading trailer"); } if (Bytes == null) // safety catch { break; } /** get trailer */ int i = 0; final int maxLen = Bytes.length; // for(int a=0;a<100;a++) // System.out.println((char)Bytes[i+a]); while (i < maxLen) { // look for trailer keyword if (Bytes[i] == 116 && Bytes[i + 1] == 114 && Bytes[i + 2] == 97 && Bytes[i + 3] == 105 && Bytes[i + 4] == 108 && Bytes[i + 5] == 101 && Bytes[i + 6] == 114) { break; } i++; } // save endtable position for later endTable = i; if (i == Bytes.length) { break; } // move to beyond << while (Bytes[i] != 60 && Bytes[i - 1] != 60) { i++; } i++; final PdfObject pdfObject = new CompressedObject("1 0 R"); Dictionary.readDictionary(pdfObject, i, Bytes, -1, true, currentPdfFile, false); // move to beyond >> int level = 0; while (true) { if (Bytes[i] == 60 && Bytes[i - 1] == 60) { level++; i++; } else if (Bytes[i] == '[') { i++; while (Bytes[i] != ']') { i++; if (i == Bytes.length) { break; } } } else if (Bytes[i] == 62 && Bytes[i - 1] == 62) { level--; i++; } if (level == 0) { break; } i++; } // handle optional XRefStm final int XRefStm = pdfObject.getInt(PdfDictionary.XRefStm); if (XRefStm != -1) { pointer = XRefStm; } else { // usual way boolean hasRef = true; /** handle spaces and comments */ while (Bytes[i] == 10 || Bytes[i] == 13) { i++; } while (Bytes[i] == '%') { while (Bytes[i] != 10) { i++; } i++; } /* fix for /Users/markee/Downloads/oneiderapartnerbrochure_web_1371798737.pdf /**/ // look for xref as end of startref while (Bytes[i] != 116 && Bytes[i + 1] != 120 && Bytes[i + 2] != 114 && Bytes[i + 3] != 101 && Bytes[i + 4] != 102) { if (Bytes[i] == 'o' && Bytes[i + 1] == 'b' && Bytes[i + 2] == 'j') { hasRef = false; break; } i++; } if (hasRef) { i += 8; // move to start of value ignoring spaces or returns while ((i < maxLen) && (Bytes[i] == 10 || Bytes[i] == 32 || Bytes[i] == 13)) { i++; } final int s = i; // allow for characters between xref and startref while (i < maxLen && Bytes[i] != 10 && Bytes[i] != 32 && Bytes[i] != 13) { i++; } /** convert xref to string to get pointer */ if (s != i) { pointer = NumberUtils.parseInt(s, i, Bytes); } } } i = 0; // allow for bum data at start while (Bytes[i] == 13 || Bytes[i] == 10 || Bytes[i] == 9) { i++; } if (pointer == -1) { if (LogWriter.isOutput()) { LogWriter.writeLog("No startRef"); } /** now read the objects for the trailers */ } else if (Bytes[i] == 120 && Bytes[i + 1] == 114 && Bytes[i + 2] == 101 && Bytes[i + 3] == 102) { // make sure starts xref i = 5; // move to start of value ignoring spaces or returns while (Bytes[i] == 10 || Bytes[i] == 32 || Bytes[i] == 13) { i++; } current = offset.readXRefs(current, Bytes, endTable, i, eof, pdf_datafile); /** * now process trailer values - only first set of table values for root, encryption and info */ if (rootObj == null) { rootObj = pdfObject.getDictionary(PdfDictionary.Root); encryptObj = pdfObject.getDictionary(PdfDictionary.Encrypt); if (encryptObj != null) { final byte[][] IDs = pdfObject.getStringArray(PdfDictionary.ID); if (IDs != null && this.ID == null) { // only the first encountered ID should be used as a fileID for decryption this.ID = IDs[0]; } } infoObject = pdfObject.getDictionary(PdfDictionary.Info); } // make sure first values used if several tables and code for prev pointer = pdfObject.getInt(PdfDictionary.Prev); // see if other trailers if (pointer != -1 && pointer < this.eof) { // reset values for loop bufSize = 1024; // track ref table so we can work out object length offset.addXref(pointer); } else // reset if fails second test above { pointer = -1; } } else { pointer = -1; // needs to be read to pick up potential /Pages value //noinspection ObjectAllocationInLoop rootObj = new PageObject(BrokenRefTable.findOffsets(pdf_datafile, offset)); currentPdfFile.readObject(rootObj); offset.setRefTableInvalid(true); } if (pointer == -1) { break; } } if (encryptObj == null && rootObj != null) { // manual check for broken file (ignore if Encrypted) int type = -1; int status = rootObj.getStatus(); byte[] data = rootObj.getUnresolvedData(); try { final ObjectDecoder objectDecoder = new ObjectDecoder(currentPdfFile); objectDecoder.checkResolved(rootObj); type = rootObj.getParameterConstant(PdfDictionary.Type); } catch (Exception e) { // we need to ignore so just catch, put back as was and log rootObj.setStatus(status); rootObj.setUnresolvedData(data, status); if (LogWriter.isOutput()) { LogWriter.writeLog("[PDF] Exception reading type on root object " + e); } } // something gone wrong so manually index if (type == PdfDictionary.Font) { // see 21153 - ref table in wrong order rootObj = null; // /will reset in code at end } } // something gone wrong so manually index if (rootObj == null) { // see 21382 offset.clear(); offset.reuse(); // needs to be read to pick up potential /Pages value //noinspection ObjectAllocationInLoop rootObj = new PageObject(BrokenRefTable.findOffsets(pdf_datafile, offset)); currentPdfFile.readObject(rootObj); offset.setRefTableInvalid(true); } return rootObj; }
/** * read reference table start to see if new 1.5 type or traditional xref * * @throws PdfException */ public final PdfObject readReferenceTable( final PdfObject linearObj, final PdfFileReader currentPdfFile, final ObjectReader objectReader) throws PdfException { int pointer = -1; final int eof = (int) this.eof; boolean islinearizedCompressed = false; if (linearObj == null) { pointer = readFirstStartRef(); } else { // find at start of Linearized final byte[] data = pdf_datafile.getPdfBuffer(); final int count = data.length; int ptr = 5; for (int i = 0; i < count; i++) { // track start of this object (needed for compressed) if (data[i] == 'e' && data[i + 1] == 'n' && data[i + 2] == 'd' && data[i + 3] == 'o' && data[i + 4] == 'b' && data[i + 5] == 'j') { ptr = i + 6; } if (data[i] == 'x' && data[i + 1] == 'r' && data[i + 2] == 'e' && data[i + 3] == 'f') { pointer = i; i = count; } else if (data[i] == 'X' && data[i + 1] == 'R' && data[i + 2] == 'e' && data[i + 3] == 'f') { islinearizedCompressed = true; pointer = ptr; while (data[pointer] == 10 || data[pointer] == 13 || data[pointer] == 32) { pointer++; } i = count; } } } offset.addXref(pointer); PdfObject rootObj = null; if (pointer >= eof || pointer == 0) { if (LogWriter.isOutput()) { LogWriter.writeLog("Pointer not if file - trying to manually find startref"); } offset.setRefTableInvalid(true); try { rootObj = new PageObject(BrokenRefTable.findOffsets(pdf_datafile, offset)); } catch (Error err) { throw new PdfException(err.getMessage() + " attempting to manually scan file for objects"); } currentPdfFile.readObject(rootObj); return rootObj; } else if (islinearizedCompressed || isCompressedStream(pointer, eof)) { return readCompressedStream(rootObj, pointer, currentPdfFile, objectReader, linearObj); } else { return readLegacyReferenceTable(rootObj, pointer, eof, currentPdfFile); } }
/** * Run length decode. If both data and cached stream are present it will check they are identical */ @Override public void decode( final BufferedInputStream bis, final BufferedOutputStream streamCache, final String cacheName, final Map<String, String> cachedObjects) { this.bis = bis; this.streamCache = streamCache; this.cachedObjects = cachedObjects; try { final int count; int len; int nextLen; int value2; count = bis.available(); for (int i = 0; i < count; i++) { nextLen = bis.read(); if (nextLen >= 128) { nextLen -= 256; } len = nextLen; if (len < 0) { len = 256 + len; } if (len == 128) { i = count; } else if (len > 128) { i++; len = 257 - len; value2 = bis.read(); if (value2 >= 128) { value2 -= 256; } for (int j = 0; j < len; j++) { streamCache.write(value2); } } else { i++; len++; for (int j = 0; j < len; j++) { value2 = bis.read(); if (value2 >= 128) { value2 -= 256; } streamCache.write(value2); } i = i + len - 1; } } } catch (final IOException e1) { if (LogWriter.isOutput()) { LogWriter.writeLog("IO exception in RunLength " + e1); } } }