Coverage Report

Created: 2025-08-03 06:15

/src/qpdf/libqpdf/Pl_QPDFTokenizer.cc
Line
Count
Source
1
#include <qpdf/Pl_QPDFTokenizer.hh>
2
3
#include <qpdf/InputSource_private.hh>
4
#include <qpdf/Pipeline_private.hh>
5
#include <qpdf/QTC.hh>
6
7
#include <stdexcept>
8
9
using namespace qpdf;
10
11
class Pl_QPDFTokenizer::Members
12
{
13
  public:
14
2.73k
    Members() = default;
15
    Members(Members const&) = delete;
16
2.73k
    ~Members() = default;
17
18
    QPDFObjectHandle::TokenFilter* filter{nullptr};
19
    QPDFTokenizer tokenizer;
20
    std::string buffer;
21
    pl::String buf{"pl_tokenizer", nullptr, buffer};
22
};
23
24
Pl_QPDFTokenizer::Pl_QPDFTokenizer(
25
    char const* identifier, QPDFObjectHandle::TokenFilter* filter, Pipeline* next) :
26
2.73k
    Pipeline(identifier, next),
27
2.73k
    m(std::make_unique<Members>())
28
2.73k
{
29
2.73k
    m->filter = filter;
30
2.73k
    QPDFObjectHandle::TokenFilter::PipelineAccessor::setPipeline(m->filter, next);
31
2.73k
    m->tokenizer.allowEOF();
32
2.73k
    m->tokenizer.includeIgnorable();
33
2.73k
}
34
35
// Must be explicit and not inline -- see QPDF_DLL_CLASS in README-maintainer
36
2.73k
Pl_QPDFTokenizer::~Pl_QPDFTokenizer() = default;
37
38
void
39
Pl_QPDFTokenizer::write(unsigned char const* data, size_t len)
40
392k
{
41
392k
    m->buf.write(data, len);
42
392k
}
43
44
void
45
Pl_QPDFTokenizer::finish()
46
2.37k
{
47
2.37k
    auto input = is::OffsetBuffer("tokenizer data", m->buffer);
48
2.37k
    std::string empty;
49
31.2M
    while (true) {
50
31.2M
        auto token = m->tokenizer.readToken(input, empty, true);
51
31.2M
        m->filter->handleToken(token);
52
31.2M
        if (token.getType() == QPDFTokenizer::tt_eof) {
53
2.37k
            break;
54
31.2M
        } else if (token.isWord("ID")) {
55
            // Read the space after the ID.
56
1.60k
            char ch = ' ';
57
1.60k
            input.read(&ch, 1);
58
1.60k
            m->filter->handleToken(
59
                // line-break
60
1.60k
                QPDFTokenizer::Token(QPDFTokenizer::tt_space, std::string(1, ch)));
61
1.60k
            QTC::TC("qpdf", "Pl_QPDFTokenizer found ID");
62
1.60k
            m->tokenizer.expectInlineImage(input);
63
1.60k
        }
64
31.2M
    }
65
2.37k
    m->filter->handleEOF();
66
2.37k
    QPDFObjectHandle::TokenFilter::PipelineAccessor::setPipeline(m->filter, nullptr);
67
2.37k
    if (next()) {
68
2.37k
        next()->finish();
69
2.37k
    }
70
2.37k
}