PDFObjectStreamParserTest.java
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.pdfbox.pdfparser;
import static org.junit.jupiter.api.Assertions.assertEquals;
import java.io.IOException;
import java.io.OutputStream;
import java.util.Map;
import org.apache.pdfbox.cos.COSBase;
import org.apache.pdfbox.cos.COSBoolean;
import org.apache.pdfbox.cos.COSDocument;
import org.apache.pdfbox.cos.COSInteger;
import org.apache.pdfbox.cos.COSName;
import org.apache.pdfbox.cos.COSObjectKey;
import org.apache.pdfbox.cos.COSStream;
import org.junit.jupiter.api.Test;
/**
* Test for PDFObjectStreamParser.
*/
class PDFObjectStreamParserTest
{
@Test
void testOffsetParsing() throws IOException
{
COSStream stream = new COSStream();
stream.setItem(COSName.N, COSInteger.TWO);
stream.setItem(COSName.FIRST, COSInteger.get(8));
OutputStream outputStream = stream.createOutputStream();
outputStream.write("4 0 6 5 true false".getBytes());
outputStream.close();
PDFObjectStreamParser objectStreamParser = new PDFObjectStreamParser(stream, null);
Map<Long, Integer> objectNumbers = objectStreamParser.readObjectNumbers();
assertEquals(2, objectNumbers.size());
assertEquals(0, objectNumbers.get(4L));
assertEquals(5, objectNumbers.get(6L));
objectStreamParser = new PDFObjectStreamParser(stream, null);
assertEquals(COSBoolean.TRUE, objectStreamParser.parseObject(4));
objectStreamParser = new PDFObjectStreamParser(stream, null);
assertEquals(COSBoolean.FALSE, objectStreamParser.parseObject(6));
}
@Test
void testParseAllObjects() throws IOException
{
COSStream stream = new COSStream();
stream.setItem(COSName.N, COSInteger.TWO);
stream.setItem(COSName.FIRST, COSInteger.get(8));
OutputStream outputStream = stream.createOutputStream();
outputStream.write("6 0 4 5 true false".getBytes());
outputStream.close();
PDFObjectStreamParser objectStreamParser = new PDFObjectStreamParser(stream, null);
Map<COSObjectKey, COSBase> objectNumbers = objectStreamParser.parseAllObjects();
assertEquals(2, objectNumbers.size());
assertEquals(COSBoolean.TRUE, objectNumbers.get(new COSObjectKey(6, 0)));
assertEquals(COSBoolean.FALSE, objectNumbers.get(new COSObjectKey(4, 0)));
}
@Test
void testParseAllObjectsIndexed() throws IOException
{
COSStream stream = new COSStream();
stream.setItem(COSName.N, COSInteger.THREE);
stream.setItem(COSName.FIRST, COSInteger.get(13));
OutputStream outputStream = stream.createOutputStream();
// use object number 4 for two objects
outputStream.write("6 0 4 5 4 11 true false true".getBytes());
outputStream.close();
COSDocument cosDoc = new COSDocument();
Map<COSObjectKey, Long> xrefTable = cosDoc.getXrefTable();
// select the second object from the stream for object number 4 by using 2 as value for the index
xrefTable.put(new COSObjectKey(6, 0, 0), -1L);
xrefTable.put(new COSObjectKey(4, 0, 2), -1L);
PDFObjectStreamParser objectStreamParser = new PDFObjectStreamParser(stream, cosDoc);
Map<COSObjectKey, COSBase> objectNumbers = objectStreamParser.parseAllObjects();
assertEquals(2, objectNumbers.size());
assertEquals(COSBoolean.TRUE, objectNumbers.get(new COSObjectKey(6, 0)));
assertEquals(COSBoolean.TRUE, objectNumbers.get(new COSObjectKey(4, 0)));
// select the first object from the stream for object number 4 by using 1 as value for the index
// remove the old entry first to be sure it is replaced
xrefTable.remove(new COSObjectKey(4, 0));
xrefTable.put(new COSObjectKey(4, 0, 1), -1L);
objectStreamParser = new PDFObjectStreamParser(stream, cosDoc);
objectNumbers = objectStreamParser.parseAllObjects();
assertEquals(2, objectNumbers.size());
assertEquals(COSBoolean.TRUE, objectNumbers.get(new COSObjectKey(6, 0)));
assertEquals(COSBoolean.FALSE, objectNumbers.get(new COSObjectKey(4, 0)));
}
@Test
void testParseAllObjectsSkipMalformedIndex() throws IOException
{
COSStream stream = new COSStream();
stream.setItem(COSName.N, COSInteger.THREE);
stream.setItem(COSName.FIRST, COSInteger.get(13));
OutputStream outputStream = stream.createOutputStream();
outputStream.write("6 0 4 5 5 11 true false true".getBytes());
outputStream.close();
COSDocument cosDoc = new COSDocument();
Map<COSObjectKey, Long> xrefTable = cosDoc.getXrefTable();
// add an index for each object key which doesn't match with the index of the object stream
xrefTable.put(new COSObjectKey(6, 0, 10), -1L);
xrefTable.put(new COSObjectKey(4, 0, 11), -1L);
xrefTable.put(new COSObjectKey(5, 0, 12), -1L);
PDFObjectStreamParser objectStreamParser = new PDFObjectStreamParser(stream, cosDoc);
// the index isn't taken into account as all object numbers of the stream are unique
// none of the objects is skipped so that all objects are read and available
Map<COSObjectKey, COSBase> objectNumbers = objectStreamParser.parseAllObjects();
assertEquals(3, objectNumbers.size());
assertEquals(COSBoolean.TRUE, objectNumbers.get(new COSObjectKey(6, 0)));
assertEquals(COSBoolean.FALSE, objectNumbers.get(new COSObjectKey(4, 0)));
assertEquals(COSBoolean.TRUE, objectNumbers.get(new COSObjectKey(5, 0)));
}
@Test
void testParseAllObjectsUseMalformedIndex() throws IOException
{
COSStream stream = new COSStream();
stream.setItem(COSName.N, COSInteger.THREE);
stream.setItem(COSName.FIRST, COSInteger.get(13));
OutputStream outputStream = stream.createOutputStream();
outputStream.write("6 0 4 5 4 11 true false true".getBytes());
outputStream.close();
COSDocument cosDoc = new COSDocument();
Map<COSObjectKey, Long> xrefTable = cosDoc.getXrefTable();
// add an index for each object key which doesn't match with the index of the object stream
// add two object keys only as the object stream uses one object number for two objects
xrefTable.put(new COSObjectKey(6, 0, 10), -1L);
xrefTable.put(new COSObjectKey(4, 0, 11), -1L);
PDFObjectStreamParser objectStreamParser = new PDFObjectStreamParser(stream, cosDoc);
// as the used object numbers aren't unique within the object the index of the obejct keys is used
// All objects are dropped as the malformed index values don't match the index of the object within the stream
Map<COSObjectKey, COSBase> objectNumbers = objectStreamParser.parseAllObjects();
assertEquals(0, objectNumbers.size());
}
}