Coverage Report

Created: 2026-04-01 07:17

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/ghostpdl/pdf/pdf_dict.c
Line
Count
Source
1
/* Copyright (C) 2018-2026 Artifex Software, Inc.
2
   All Rights Reserved.
3
4
   This software is provided AS-IS with no warranty, either express or
5
   implied.
6
7
   This software is distributed under license and may not be copied,
8
   modified or distributed except as expressly authorized under the terms
9
   of the license contained in the file LICENSE in this distribution.
10
11
   Refer to licensing information at http://www.artifex.com or contact
12
   Artifex Software, Inc.,  39 Mesa Street, Suite 108A, San Francisco,
13
   CA 94129, USA, for further information.
14
*/
15
16
/* dictionary handling for the PDF interpreter */
17
#include "ghostpdf.h"
18
#include "pdf_types.h"
19
#include "pdf_deref.h"
20
#include "pdf_dict.h"
21
#include "pdf_stack.h"
22
#include "pdf_array.h"
23
#include "pdf_int.h"
24
#include "pdf_loop_detect.h"
25
#include "pdf_misc.h"
26
27
static int pdfi_dict_find(pdf_context *ctx, pdf_dict *d, const char *Key, bool sort);
28
static int pdfi_dict_find_key(pdf_context *ctx, pdf_dict *d, const pdf_name *Key, bool sort);
29
30
void pdfi_free_dict(pdf_obj *o)
31
11.8M
{
32
11.8M
    pdf_dict *d = (pdf_dict *)o;
33
11.8M
    int i;
34
#if DEBUG_DICT
35
    pdf_name *name;
36
#endif
37
38
114M
    for (i=0;i < d->entries;i++) {
39
#if DEBUG_DICT
40
        name = (pdf_name *)d->list[i].key;
41
#endif
42
102M
        if (d->list[i].value != NULL)
43
102M
            pdfi_countdown(d->list[i].value);
44
102M
        if (d->list[i].key != NULL)
45
102M
            pdfi_countdown(d->list[i].key);
46
102M
    }
47
11.8M
    gs_free_object(OBJ_MEMORY(d), d->list, "pdf interpreter free dictionary key/values");
48
11.8M
    gs_free_object(OBJ_MEMORY(d), d, "pdf interpreter free dictionary");
49
11.8M
}
50
51
/* Delete a key pair, either by specifying a char * or a pdf_name *
52
 */
53
static int pdfi_dict_delete_inner(pdf_context *ctx, pdf_dict *d, pdf_name *n, const char *str)
54
218k
{
55
218k
    int i = 0;
56
#if DEBUG_DICT
57
    pdf_name *name;
58
#endif
59
60
218k
    if (n != NULL)
61
52.4k
        i = pdfi_dict_find_key(ctx, d, (const pdf_name *)n, false);
62
166k
    else
63
166k
        i = pdfi_dict_find(ctx, d, str, false);
64
65
218k
    if (i < 0)
66
52
        return i;
67
68
218k
    pdfi_countdown(d->list[i].key);
69
218k
    pdfi_countdown(d->list[i].value);
70
218k
    d->entries--;
71
218k
    if (i != d->entries)
72
59.3k
        memmove(&d->list[i], &d->list[i+1], (d->entries - i) * sizeof(d->list[0]));
73
218k
    d->list[d->entries].key = NULL;
74
218k
    d->list[d->entries].value = NULL;
75
218k
    d->is_sorted = false;
76
218k
    return 0;
77
218k
}
78
79
int pdfi_dict_delete_pair(pdf_context *ctx, pdf_dict *d, pdf_name *n)
80
52.4k
{
81
52.4k
    return pdfi_dict_delete_inner(ctx, d, n, NULL);
82
52.4k
}
83
84
int pdfi_dict_delete(pdf_context *ctx, pdf_dict *d, const char *str)
85
166k
{
86
166k
    return pdfi_dict_delete_inner(ctx, d, NULL, str);
87
166k
}
88
89
/* This function is provided for symmetry with arrays, and in case we ever
90
 * want to change the behaviour of pdfi_dict_from_stack() and pdfi_dict_alloc()
91
 * similarly to the array behaviour, where we always have null PDF objects
92
 * rather than NULL pointers stored in the dictionary.
93
 */
94
int pdfi_dict_alloc(pdf_context *ctx, uint64_t size, pdf_dict **d)
95
11.8M
{
96
11.8M
    *d = NULL;
97
11.8M
    return pdfi_object_alloc(ctx, PDF_DICT, size, (pdf_obj **)d);
98
11.8M
}
99
100
static int pdfi_dict_name_from_string(pdf_context *ctx, pdf_string *s, pdf_name **n)
101
0
{
102
0
    int code = pdfi_object_alloc(ctx, PDF_NAME, s->length, (pdf_obj **)n);
103
0
    if (code >= 0) {
104
0
        memcpy((*n)->data, s->data, s->length);
105
0
        pdfi_countup(*n);
106
0
    }
107
0
    return code;
108
0
}
109
110
int pdfi_dict_from_stack(pdf_context *ctx, uint32_t indirect_num, uint32_t indirect_gen, bool convert_string_keys)
111
11.0M
{
112
11.0M
    uint64_t index = 0;
113
11.0M
    pdf_dict *d = NULL;
114
11.0M
    uint64_t i = 0;
115
11.0M
    int code;
116
#if DEBUG_DICT
117
    pdf_name *key;
118
#endif
119
120
11.0M
    code = pdfi_count_to_mark(ctx, &index);
121
11.0M
    if (code < 0) {
122
138k
        pdfi_clear_to_mark(ctx);
123
138k
        return code;
124
138k
    }
125
126
10.9M
    if (index & 1) {
127
220k
        pdfi_clear_to_mark(ctx);
128
220k
        return_error(gs_error_rangecheck);
129
220k
    }
130
131
10.6M
    code = pdfi_dict_alloc(ctx, index >> 1, &d);
132
10.6M
    if (code < 0) {
133
0
        pdfi_clear_to_mark(ctx);
134
0
        return code;
135
0
    }
136
137
10.6M
    d->entries = d->size;
138
139
63.4M
    while (index) {
140
52.7M
        i = (index / 2) - 1;
141
142
        /* In PDF keys are *required* to be names, so we ought to check that here */
143
52.7M
        if (pdfi_type_of((pdf_obj *)ctx->stack_top[-2]) == PDF_NAME) {
144
52.7M
            d->list[i].key = ctx->stack_top[-2];
145
52.7M
            pdfi_countup(d->list[i].key);
146
#if DEBUG_DICT
147
            key = (pdf_name *)d->list[i].key;
148
#endif
149
52.7M
            d->list[i].value = ctx->stack_top[-1];
150
52.7M
            pdfi_countup(d->list[i].value);
151
52.7M
        } else {
152
44.1k
            if (convert_string_keys && (pdfi_type_of((pdf_obj *)ctx->stack_top[-2]) == PDF_STRING)) {
153
0
                pdf_name *n;
154
0
                code = pdfi_dict_name_from_string(ctx, (pdf_string *)ctx->stack_top[-2], &n);
155
0
                if (code < 0) {
156
0
                    pdfi_free_dict((pdf_obj *)d);
157
0
                    pdfi_clear_to_mark(ctx);
158
0
                    return_error(gs_error_typecheck);
159
0
                }
160
0
                d->list[i].key = (pdf_obj *)n; /* pdfi_dict_name_from_string() sets refcnt to 1 */
161
0
                d->list[i].value = ctx->stack_top[-1];
162
0
                pdfi_countup(d->list[i].value);
163
0
            }
164
44.1k
            else {
165
44.1k
                pdfi_free_dict((pdf_obj *)d);
166
44.1k
                pdfi_clear_to_mark(ctx);
167
44.1k
                return_error(gs_error_typecheck);
168
44.1k
            }
169
44.1k
        }
170
171
52.7M
        pdfi_pop(ctx, 2);
172
52.7M
        index -= 2;
173
52.7M
    }
174
175
10.6M
    code = pdfi_clear_to_mark(ctx);
176
10.6M
    if (code < 0) {
177
0
        pdfi_free_dict((pdf_obj *)d);
178
0
        return code;
179
0
    }
180
181
10.6M
    if (ctx->args.pdfdebug)
182
0
        outprintf (ctx->memory, "\n >>\n");
183
184
10.6M
    d->indirect_num = indirect_num;
185
10.6M
    d->indirect_gen = indirect_gen;
186
187
10.6M
    code = pdfi_push(ctx, (pdf_obj *)d);
188
10.6M
    if (code < 0)
189
0
        pdfi_free_dict((pdf_obj *)d);
190
191
10.6M
    return code;
192
10.6M
}
193
194
/* Convenience routine for common case where there are two possible keys */
195
int
196
pdfi_dict_get2(pdf_context *ctx, pdf_dict *d, const char *Key1,
197
               const char *Key2, pdf_obj **o)
198
1.50M
{
199
1.50M
    int code;
200
201
    /* ISO 32000-2:2020 (PDF 2.0) - abbreviated names take precendence. Assume abbreviated names are shorter :-) */
202
1.50M
    if (strlen(Key1) < strlen(Key2)) {
203
0
        code = pdfi_dict_get(ctx, d, Key1, o);
204
0
        if (code == gs_error_undefined)
205
0
            code = pdfi_dict_get(ctx, d, Key2, o);
206
1.50M
    } else {
207
1.50M
        code = pdfi_dict_get(ctx, d, Key2, o);
208
1.50M
        if (code == gs_error_undefined)
209
1.22M
            code = pdfi_dict_get(ctx, d, Key1, o);
210
1.50M
    }
211
1.50M
    return code;
212
1.50M
}
213
214
static int pdfi_dict_compare_entry(const void *a, const void *b)
215
1.16G
{
216
1.16G
    pdf_name *key_a = (pdf_name *)((pdf_dict_entry *)a)->key, *key_b = (pdf_name *)((pdf_dict_entry *)b)->key;
217
218
1.16G
    if (key_a == NULL) {
219
679k
        if (key_b == NULL)
220
679k
            return 0;
221
0
        else
222
0
            return 1;
223
679k
    }
224
225
1.16G
    if (key_b == NULL)
226
124k
        return -1;
227
228
1.16G
    if (key_a->length != key_b->length)
229
370M
        return key_a->length - key_b->length;
230
231
791M
    return strncmp((const char *)key_a->data, (const char *)key_b->data, key_a->length);
232
1.16G
}
233
234
static int pdfi_dict_find_sorted(pdf_context *ctx, pdf_dict *d, const char *Key)
235
87.9M
{
236
87.9M
    int start = 0, end = d->size - 1, middle = 0, keylen = strlen(Key);
237
87.9M
    pdf_name *test_key;
238
239
760M
    while (start <= end) {
240
756M
        middle = start + (end - start) / 2;
241
756M
        test_key = (pdf_name *)d->list[middle].key;
242
243
        /* Sorting pushes unused key/values (NULL) to the end of the dictionary */
244
756M
        if (test_key == NULL) {
245
474k
            end = middle - 1;
246
474k
            continue;
247
474k
        }
248
249
756M
        if (test_key->length == keylen) {
250
485M
            int result = strncmp((const char *)test_key->data, Key, keylen);
251
252
485M
            if (result == 0)
253
84.9M
                return middle;
254
400M
            if (result < 0)
255
205M
                start = middle + 1;
256
194M
            else
257
194M
                end = middle - 1;
258
400M
        } else {
259
271M
            if (test_key->length < keylen)
260
112M
                start = middle + 1;
261
159M
            else
262
159M
                end = middle -1;
263
271M
        }
264
756M
    }
265
3.06M
    return gs_note_error(gs_error_undefined);
266
87.9M
}
267
268
static int pdfi_dict_find_unsorted(pdf_context *ctx, pdf_dict *d, const char *Key)
269
148M
{
270
148M
    int i;
271
148M
    pdf_name *t;
272
273
20.4G
    for (i=0;i< d->entries;i++) {
274
20.3G
        t = (pdf_name *)d->list[i].key;
275
276
20.3G
        if (t && pdfi_type_of(t) == PDF_NAME) {
277
20.3G
            if (pdfi_name_is((pdf_name *)t, Key)) {
278
54.2M
                return i;
279
54.2M
            }
280
20.3G
        }
281
20.3G
    }
282
148M
    return_error(gs_error_undefined);
283
148M
}
284
285
static int pdfi_dict_find(pdf_context *ctx, pdf_dict *d, const char *Key, bool sort)
286
236M
{
287
236M
    if (!d->is_sorted) {
288
149M
        if (d->entries > 32 && sort) {
289
332k
            qsort(d->list, d->size, sizeof(pdf_dict_entry), pdfi_dict_compare_entry);
290
332k
            d->is_sorted = true;
291
332k
            return pdfi_dict_find_sorted(ctx, d, Key);
292
332k
        } else
293
148M
            return pdfi_dict_find_unsorted(ctx, d, Key);
294
149M
    } else
295
87.6M
        return pdfi_dict_find_sorted(ctx, d, Key);
296
236M
}
297
298
static int pdfi_dict_find_key(pdf_context *ctx, pdf_dict *d, const pdf_name *Key, bool sort)
299
140M
{
300
140M
    char *Test = NULL;
301
140M
    int index = 0;
302
303
140M
    Test = (char *)gs_alloc_bytes(ctx->memory, (size_t)Key->length + 1, "pdfi_dict_find_key");
304
140M
    if (Test == NULL)
305
0
        return_error(gs_error_VMerror);
306
307
140M
    memcpy(Test, Key->data, Key->length);
308
140M
    Test[Key->length] = 0x00;
309
310
140M
    index = pdfi_dict_find(ctx, d, Test, sort);
311
312
140M
    gs_free_object(ctx->memory, Test, "pdfi_dict_find_key");
313
140M
    return index;
314
140M
}
315
316
/* The object returned by pdfi_dict_get has its reference count incremented by 1 to
317
 * indicate the reference now held by the caller, in **o.
318
 */
319
int pdfi_dict_get_common(pdf_context *ctx, pdf_dict *d, const char *Key, pdf_obj **o, bool cache)
320
42.6M
{
321
42.6M
    int index = 0, code = 0;
322
323
42.6M
    *o = NULL;
324
325
42.6M
    if (pdfi_type_of(d) != PDF_DICT)
326
49.9k
        return_error(gs_error_typecheck);
327
328
42.6M
    index = pdfi_dict_find(ctx, d, Key, true);
329
42.6M
    if (index < 0)
330
10.2M
        return index;
331
332
32.3M
    if (pdfi_type_of(d->list[index].value) == PDF_INDIRECT) {
333
1.39M
        pdf_indirect_ref *r = (pdf_indirect_ref *)d->list[index].value;
334
335
1.39M
        if (r->ref_object_num == d->object_num)
336
747
            return_error(gs_error_circular_reference);
337
338
1.39M
        if (cache)
339
1.39M
            code = pdfi_deref_loop_detect(ctx, r->ref_object_num, r->ref_generation_num, o);
340
0
        else
341
0
            code = pdfi_deref_loop_detect_nocache(ctx, r->ref_object_num, r->ref_generation_num, o);
342
1.39M
        if (code < 0)
343
451k
            return code;
344
        /* The file Bug690138.pdf has font dictionaries which contain ToUnicode keys where
345
         * the value is an indirect reference to the same font object. If we replace the
346
         * indirect reference in the dictionary with the font dictionary it becomes self
347
         * referencing and never counts down to 0, leading to a memory leak.
348
         * This is clearly an error, so flag it and don't replace the indirect reference.
349
         */
350
944k
        if ((*o) < (pdf_obj *)(uintptr_t)(TOKEN__LAST_KEY)) {
351
            /* "FAST" object, therefore can't be a problem. */
352
815
            pdfi_countdown(d->list[index].value);
353
815
            d->list[index].value = *o;
354
943k
        } else if ((*o)->object_num == 0 || (*o)->object_num != d->object_num) {
355
943k
            pdfi_countdown(d->list[index].value);
356
943k
            d->list[index].value = *o;
357
943k
        } else {
358
0
            code = pdfi_set_error_stop(ctx, gs_note_error(gs_error_undefinedresult), NULL, E_DICT_SELF_REFERENCE, "pdfi_dict_get", NULL);
359
0
            return code;
360
0
        }
361
944k
    }
362
31.8M
    *o = d->list[index].value;
363
31.8M
    pdfi_countup(*o);
364
365
31.8M
    return code;
366
32.3M
}
367
368
/* Get object from dict without resolving indirect references
369
 * Will inc refcnt by 1
370
 */
371
int pdfi_dict_get_no_deref(pdf_context *ctx, pdf_dict *d, const pdf_name *Key, pdf_obj **o)
372
421k
{
373
421k
    int index=0;
374
375
421k
    *o = NULL;
376
377
421k
    if (pdfi_type_of(d) != PDF_DICT)
378
0
        return_error(gs_error_typecheck);
379
380
421k
    index = pdfi_dict_find_key(ctx, d, Key, true);
381
421k
    if (index < 0)
382
0
        return index;
383
384
421k
    *o = d->list[index].value;
385
421k
    pdfi_countup(*o);
386
421k
    return 0;
387
421k
}
388
389
/* Get by pdf_name rather than by char *
390
 * The object returned by pdfi_dict_get has its reference count incremented by 1 to
391
 * indicate the reference now held by the caller, in **o.
392
 */
393
int pdfi_dict_get_by_key(pdf_context *ctx, pdf_dict *d, const pdf_name *Key, pdf_obj **o)
394
90.1M
{
395
90.1M
    int index=0, code = 0;
396
397
90.1M
    *o = NULL;
398
399
90.1M
    if (pdfi_type_of(d) != PDF_DICT)
400
263
        return_error(gs_error_typecheck);
401
402
90.1M
    index = pdfi_dict_find_key(ctx, d, Key, true);
403
90.1M
    if (index < 0)
404
5.05M
        return index;
405
406
85.1M
    if (pdfi_type_of(d->list[index].value) == PDF_INDIRECT) {
407
75.4k
        pdf_indirect_ref *r = (pdf_indirect_ref *)d->list[index].value;
408
409
75.4k
        code = pdfi_deref_loop_detect(ctx, r->ref_object_num, r->ref_generation_num, o);
410
75.4k
        if (code < 0)
411
28.6k
            return code;
412
46.7k
        pdfi_countdown(d->list[index].value);
413
46.7k
        d->list[index].value = *o;
414
46.7k
    }
415
85.0M
    *o = d->list[index].value;
416
85.0M
    pdfi_countup(*o);
417
85.0M
    return 0;
418
85.1M
}
419
420
/* Get indirect reference without de-referencing it */
421
int pdfi_dict_get_ref(pdf_context *ctx, pdf_dict *d, const char *Key, pdf_indirect_ref **o)
422
0
{
423
0
    int index=0;
424
425
0
    *o = NULL;
426
427
0
    if (pdfi_type_of(d) != PDF_DICT)
428
0
        return_error(gs_error_typecheck);
429
430
0
    index = pdfi_dict_find(ctx, d, Key, true);
431
0
    if (index < 0)
432
0
        return index;
433
434
0
    if (pdfi_type_of(d->list[index].value) == PDF_INDIRECT) {
435
0
        *o = (pdf_indirect_ref *)d->list[index].value;
436
0
        pdfi_countup(*o);
437
0
        return 0;
438
0
    } else {
439
0
        return_error(gs_error_typecheck);
440
0
    }
441
0
}
442
443
/* As per pdfi_dict_get(), but doesn't replace an indirect reference in a dictionary with a
444
 * new object. This is for Resources following, such as Do, where we will have to seek and
445
 * read the indirect object anyway, and we need to ensure that Form XObjects (for example)
446
 * don't have circular calls.
447
 *
448
 * Takes either strKey or nameKey param. Other will be NULL.
449
 */
450
static int pdfi_dict_get_no_store_R_inner(pdf_context *ctx, pdf_dict *d, const char *strKey,
451
                                          const pdf_name *nameKey, pdf_obj **o)
452
3.26M
{
453
3.26M
    int index=0, code = 0;
454
455
3.26M
    *o = NULL;
456
457
3.26M
    if (pdfi_type_of(d) != PDF_DICT)
458
0
        return_error(gs_error_typecheck);
459
460
3.26M
    if (strKey == NULL)
461
2.59M
        index = pdfi_dict_find_key(ctx, d, nameKey, true);
462
667k
    else
463
667k
        index = pdfi_dict_find(ctx, d, strKey, true);
464
465
3.26M
    if (index < 0)
466
140k
        return index;
467
468
3.12M
    if (pdfi_type_of(d->list[index].value) == PDF_INDIRECT) {
469
2.61M
        pdf_indirect_ref *r = (pdf_indirect_ref *)d->list[index].value;
470
471
2.61M
        code = pdfi_dereference(ctx, r->ref_object_num, r->ref_generation_num, o);
472
2.61M
        if (code < 0)
473
1.11M
            return code;
474
2.61M
    } else {
475
510k
        *o = d->list[index].value;
476
510k
        pdfi_countup(*o);
477
510k
    }
478
2.00M
    return 0;
479
3.12M
}
480
481
/* Wrapper to pdfi_dict_no_store_R_inner(), takes a char * as Key */
482
int pdfi_dict_get_no_store_R(pdf_context *ctx, pdf_dict *d, const char *Key, pdf_obj **o)
483
667k
{
484
667k
    return pdfi_dict_get_no_store_R_inner(ctx, d, Key, NULL, o);
485
667k
}
486
487
/* Wrapper to pdfi_dict_no_store_R_inner(), takes a pdf_name * as Key */
488
int pdfi_dict_get_no_store_R_key(pdf_context *ctx, pdf_dict *d, const pdf_name *Key, pdf_obj **o)
489
2.59M
{
490
2.59M
    return pdfi_dict_get_no_store_R_inner(ctx, d, NULL, Key, o);
491
2.59M
}
492
493
/* Convenience routine for common case where there are two possible keys */
494
int
495
pdfi_dict_get_type2(pdf_context *ctx, pdf_dict *d, const char *Key1, const char *Key2, pdf_obj_type type, pdf_obj **o)
496
0
{
497
0
    int code;
498
499
    /* ISO 32000-2:2020 (PDF 2.0) - abbreviated names take precendence. Assume abbreviated names are shorter :-) */
500
0
    if (strlen(Key1) < strlen(Key2)) {
501
0
        code = pdfi_dict_get_type(ctx, d, Key1, type, o);
502
0
        if (code == gs_error_undefined)
503
0
            code = pdfi_dict_get_type(ctx, d, Key2, type, o);
504
0
    } else {
505
0
        code = pdfi_dict_get_type(ctx, d, Key2, type, o);
506
0
        if (code == gs_error_undefined)
507
0
            code = pdfi_dict_get_type(ctx, d, Key1, type, o);
508
0
    }
509
0
    return code;
510
0
}
511
512
int pdfi_dict_get_type(pdf_context *ctx, pdf_dict *d, const char *Key, pdf_obj_type type, pdf_obj **o)
513
20.5M
{
514
20.5M
    int code;
515
516
20.5M
    code = pdfi_dict_get(ctx, d, Key, o);
517
20.5M
    if (code < 0)
518
2.18M
        return code;
519
520
18.3M
    if (pdfi_type_of(*o) != type) {
521
19.6k
        pdfi_countdown(*o);
522
19.6k
        *o = NULL;
523
19.6k
        return_error(gs_error_typecheck);
524
19.6k
    }
525
18.3M
    return 0;
526
18.3M
}
527
528
int pdfi_dict_get_type_no_store_R(pdf_context *ctx, pdf_dict *d, const char *Key, pdf_obj_type type, pdf_obj **o)
529
163
{
530
163
    int code;
531
532
163
    code = pdfi_dict_get_no_store_R(ctx, d, Key, o);
533
163
    if (code < 0)
534
12
        return code;
535
536
151
    if (pdfi_type_of(*o) != type) {
537
0
        pdfi_countdown(*o);
538
0
        *o = NULL;
539
0
        return_error(gs_error_typecheck);
540
0
    }
541
151
    return 0;
542
151
}
543
544
/* Convenience routine for common case where value has two possible keys */
545
int
546
pdfi_dict_get_int2(pdf_context *ctx, pdf_dict *d, const char *Key1,
547
                   const char *Key2, int64_t *i)
548
375k
{
549
375k
    int code;
550
551
    /* ISO 32000-2:2020 (PDF 2.0) - abbreviated names take precendence. Assume abbreviated names are shorter :-) */
552
375k
    if (strlen(Key1) < strlen(Key2)) {
553
0
        code = pdfi_dict_get_int(ctx, d, Key1, i);
554
0
        if (code == gs_error_undefined)
555
0
            code = pdfi_dict_get_int(ctx, d, Key2, i);
556
375k
    } else {
557
375k
        code = pdfi_dict_get_int(ctx, d, Key2, i);
558
375k
        if (code == gs_error_undefined)
559
104k
            code = pdfi_dict_get_int(ctx, d, Key1, i);
560
375k
    }
561
375k
    return code;
562
375k
}
563
564
int pdfi_dict_get_int(pdf_context *ctx, pdf_dict *d, const char *Key, int64_t *i)
565
6.77M
{
566
6.77M
    int code;
567
6.77M
    pdf_obj *n;
568
569
6.77M
    code = pdfi_dict_get(ctx, d, Key, &n);
570
6.77M
    if (code < 0)
571
1.41M
        return code;
572
5.35M
    code = pdfi_obj_to_int(ctx, n, i);
573
5.35M
    pdfi_countdown(n);
574
5.35M
    return code;
575
6.77M
}
576
577
/* Get an int from dict, and if undefined, return provided default */
578
int pdfi_dict_get_int_def(pdf_context *ctx, pdf_dict *d, const char *Key, int64_t *i,
579
                          int64_t def_val)
580
156k
{
581
156k
    int code;
582
583
156k
    code = pdfi_dict_get_int(ctx, d, Key, i);
584
156k
    if (code == gs_error_undefined) {
585
24.4k
        *i = def_val;
586
24.4k
        code = 0;
587
24.4k
    }
588
589
156k
    return code;
590
156k
}
591
592
/* Convenience routine for common case where value has two possible keys */
593
int
594
pdfi_dict_get_bool2(pdf_context *ctx, pdf_dict *d, const char *Key1,
595
                    const char *Key2, bool *val)
596
751k
{
597
751k
    int code;
598
599
    /* ISO 32000-2:2020 (PDF 2.0) - abbreviated names take precendence. Assume abbreviated names are shorter :-) */
600
751k
    if (strlen(Key1) < strlen(Key2)) {
601
0
        code = pdfi_dict_get_bool(ctx, d, Key1, val);
602
0
        if (code == gs_error_undefined)
603
0
            code = pdfi_dict_get_bool(ctx, d, Key2, val);
604
751k
    } else {
605
751k
        code = pdfi_dict_get_bool(ctx, d, Key2, val);
606
751k
        if (code == gs_error_undefined)
607
480k
            code = pdfi_dict_get_bool(ctx, d, Key1, val);
608
751k
    }
609
751k
    return code;
610
751k
}
611
612
int pdfi_dict_get_bool(pdf_context *ctx, pdf_dict *d, const char *Key, bool *val)
613
1.96M
{
614
1.96M
    int code;
615
1.96M
    pdf_obj *b;
616
617
1.96M
    code = pdfi_dict_get(ctx, d, Key, &b);
618
1.96M
    if (code < 0)
619
1.18M
        return code;
620
621
780k
    if (b == PDF_TRUE_OBJ) {
622
447k
        *val = 1;
623
447k
        return 0;
624
447k
    } else if (b == PDF_FALSE_OBJ) {
625
332k
        *val = 0;
626
332k
        return 0;
627
332k
    }
628
629
83
    pdfi_countdown(b);
630
631
83
    *val = 0; /* Be consistent at least! */
632
83
    return_error(gs_error_typecheck);
633
780k
}
634
635
int pdfi_dict_get_number2(pdf_context *ctx, pdf_dict *d, const char *Key1, const char *Key2, double *f)
636
754k
{
637
754k
    int code;
638
639
    /* ISO 32000-2:2020 (PDF 2.0) - abbreviated names take precendence. Assume abbreviated names are shorter :-) */
640
754k
    if (strlen(Key1) < strlen(Key2)) {
641
0
        code = pdfi_dict_get_number(ctx, d, Key1, f);
642
0
        if (code == gs_error_undefined)
643
0
            code = pdfi_dict_get_number(ctx, d, Key2, f);
644
754k
    } else {
645
754k
        code = pdfi_dict_get_number(ctx, d, Key2, f);
646
754k
        if (code == gs_error_undefined)
647
208k
            code = pdfi_dict_get_number(ctx, d, Key1, f);
648
754k
    }
649
754k
    return code;
650
754k
}
651
652
int pdfi_dict_get_number(pdf_context *ctx, pdf_dict *d, const char *Key, double *f)
653
2.92M
{
654
2.92M
    int code;
655
2.92M
    pdf_obj *o;
656
657
2.92M
    code = pdfi_dict_get(ctx, d, Key, &o);
658
2.92M
    if (code < 0)
659
1.11M
        return code;
660
1.80M
    code = pdfi_obj_to_real(ctx, o, f);
661
1.80M
    pdfi_countdown(o);
662
663
1.80M
    return code;
664
2.92M
}
665
666
/* convenience functions for retrieving arrys, see shadings and functions */
667
668
/* The 'fill' versions fill existing arrays, and need a size,
669
 * the 'make' versions allocate memory and fill it. Both varieties return the
670
 * number of entries on success. The fill Matrix utility expects to always
671
 * receive 6 values. The Domain function expects to receive an even number of
672
 * entries and each pair must have the second element larger than the first.
673
 */
674
int fill_domain_from_dict(pdf_context *ctx, float *parray, int size, pdf_dict *dict)
675
15.6k
{
676
15.6k
    int code, i;
677
15.6k
    pdf_array *a = NULL;
678
15.6k
    double f;
679
15.6k
    uint64_t array_size;
680
681
15.6k
    code = pdfi_dict_get(ctx, dict, "Domain", (pdf_obj **)&a);
682
15.6k
    if (code < 0)
683
7.09k
        return code;
684
8.56k
    if (pdfi_type_of(a) != PDF_ARRAY) {
685
0
        pdfi_countdown(a);
686
0
        return_error(gs_error_typecheck);
687
0
    }
688
8.56k
    array_size = pdfi_array_size(a);
689
8.56k
    if (array_size & 1 || array_size > size) {
690
11
        pdfi_countdown(a);
691
11
        return_error(gs_error_rangecheck);
692
11
    }
693
694
25.6k
    for (i=0;i< array_size;i++) {
695
17.1k
        code = pdfi_array_get_number(ctx, a, (uint64_t)i, &f);
696
17.1k
        if (code < 0) {
697
9
            pdfi_countdown(a);
698
9
            return_error(code);
699
9
        }
700
17.0k
        parray[i] = (float)f;
701
17.0k
    }
702
8.54k
    pdfi_countdown(a);
703
8.54k
    return array_size;
704
8.55k
}
705
706
int fill_float_array_from_dict(pdf_context *ctx, float *parray, int size, pdf_dict *dict, const char *Key)
707
17.3k
{
708
17.3k
    int code, i;
709
17.3k
    pdf_array *a = NULL;
710
17.3k
    double f;
711
17.3k
    uint64_t array_size;
712
713
17.3k
    code = pdfi_dict_get(ctx, dict, Key, (pdf_obj **)&a);
714
17.3k
    if (code < 0)
715
37
        return code;
716
17.3k
    if (pdfi_type_of(a) != PDF_ARRAY) {
717
0
        code = gs_note_error(gs_error_typecheck);
718
0
        goto exit;
719
0
    }
720
17.3k
    array_size = pdfi_array_size(a);
721
17.3k
    if (array_size > size) {
722
5
        code = gs_note_error(gs_error_rangecheck);
723
5
        goto exit;
724
5
    }
725
726
96.5k
    for (i=0; i< array_size; i++) {
727
79.1k
        code = pdfi_array_get_number(ctx, a, (uint64_t)i, &f);
728
79.1k
        if (code < 0)
729
9
            goto exit;
730
79.1k
        parray[i] = (float)f;
731
79.1k
    }
732
17.3k
    code = array_size;
733
17.3k
 exit:
734
17.3k
    pdfi_countdown(a);
735
17.3k
    return code;
736
17.3k
}
737
738
int fill_bool_array_from_dict(pdf_context *ctx, bool *parray, int size, pdf_dict *dict, const char *Key)
739
15.6k
{
740
15.6k
    int code, i;
741
15.6k
    pdf_array *a = NULL;
742
15.6k
    pdf_obj *o;
743
15.6k
    uint64_t array_size;
744
745
15.6k
    code = pdfi_dict_get(ctx, dict, Key, (pdf_obj **)&a);
746
15.6k
    if (code < 0)
747
411
        return code;
748
15.2k
    if (pdfi_type_of(a) != PDF_ARRAY) {
749
0
        pdfi_countdown(a);
750
0
        return_error(gs_error_typecheck);
751
0
    }
752
15.2k
    array_size = pdfi_array_size(a);
753
15.2k
    if (array_size > size)
754
0
        return_error(gs_error_rangecheck);
755
756
45.6k
    for (i=0;i< array_size;i++) {
757
30.4k
        code = pdfi_array_get(ctx, a, (uint64_t)i, (pdf_obj **)&o);
758
30.4k
        if (code < 0) {
759
0
            pdfi_countdown(a);
760
0
            return_error(code);
761
0
        }
762
30.4k
        if (o == PDF_TRUE_OBJ) {
763
29.4k
            parray[i] = 1;
764
29.4k
        } else if (o == PDF_FALSE_OBJ) {
765
997
            parray[i] = 0;
766
997
        } else {
767
7
            pdfi_countdown(o);
768
7
            pdfi_countdown(a);
769
7
            return_error(gs_error_typecheck);
770
7
        }
771
30.4k
    }
772
15.2k
    pdfi_countdown(a);
773
15.2k
    return array_size;
774
15.2k
}
775
776
int fill_matrix_from_dict(pdf_context *ctx, float *parray, pdf_dict *dict)
777
10
{
778
10
    int code, i;
779
10
    pdf_array *a = NULL;
780
10
    double f;
781
10
    uint64_t array_size;
782
783
10
    code = pdfi_dict_get(ctx, dict, "Matrix", (pdf_obj **)&a);
784
10
    if (code < 0)
785
10
        return code;
786
0
    if (pdfi_type_of(a) != PDF_ARRAY) {
787
0
        pdfi_countdown(a);
788
0
        return_error(gs_error_typecheck);
789
0
    }
790
0
    array_size = pdfi_array_size(a);
791
0
    if (array_size != 6) {
792
0
        pdfi_countdown(a);
793
0
        return_error(gs_error_rangecheck);
794
0
    }
795
796
0
    for (i=0; i< array_size; i++) {
797
0
        code = pdfi_array_get_number(ctx, a, (uint64_t)i, &f);
798
0
        if (code < 0) {
799
0
            pdfi_countdown(a);
800
0
            return_error(code);
801
0
        }
802
0
        parray[i] = (float)f;
803
0
    }
804
0
    pdfi_countdown(a);
805
0
    return array_size;
806
0
}
807
808
/* Returns < 0 for error or the number of entries allocated */
809
int pdfi_make_float_array_from_dict(pdf_context *ctx, float **parray, pdf_dict *dict, const char *Key)
810
250k
{
811
250k
    int code, i;
812
250k
    pdf_array *a = NULL;
813
250k
    float *arr = NULL;
814
250k
    double f;
815
250k
    uint64_t array_size;
816
817
250k
    *parray = NULL;
818
819
250k
    code = pdfi_dict_get(ctx, dict, Key, (pdf_obj **)&a);
820
250k
    if (code < 0)
821
44.2k
        return code;
822
205k
    if (pdfi_type_of(a) != PDF_ARRAY) {
823
0
        pdfi_countdown(a);
824
0
        return_error(gs_error_typecheck);
825
0
    }
826
205k
    array_size = pdfi_array_size(a);
827
828
205k
    arr = (float *)gs_alloc_byte_array(ctx->memory, array_size,
829
205k
                                       sizeof(float), "array_from_dict_key");
830
205k
    if (arr == NULL)
831
0
        return_error(gs_error_VMerror);
832
833
205k
    *parray = arr;
834
835
887k
    for (i=0;i< array_size;i++) {
836
681k
        code = pdfi_array_get_number(ctx, a, (uint64_t)i, &f);
837
681k
        if (code < 0) {
838
210
            gs_free_const_object(ctx->memory, arr, "float_array");
839
210
            *parray = NULL;
840
210
            pdfi_countdown(a);
841
210
            return_error(code);
842
210
        }
843
681k
        (*parray)[i] = (float)f;
844
681k
    }
845
205k
    pdfi_countdown(a);
846
205k
    return array_size;
847
205k
}
848
849
int pdfi_make_int_array_from_dict(pdf_context *ctx, int **parray, pdf_dict *dict, const char *Key)
850
17.9k
{
851
17.9k
    int code, i;
852
17.9k
    pdf_array *a = NULL;
853
17.9k
    int *arr = NULL;
854
17.9k
    pdf_num *o;
855
17.9k
    uint64_t array_size;
856
857
17.9k
    *parray = NULL;
858
859
17.9k
    code = pdfi_dict_get(ctx, dict, Key, (pdf_obj **)&a);
860
17.9k
    if (code < 0)
861
41
        return code;
862
17.9k
    if (pdfi_type_of(a) != PDF_ARRAY) {
863
0
        pdfi_countdown(a);
864
0
        return_error(gs_error_typecheck);
865
0
    }
866
17.9k
    array_size = pdfi_array_size(a);
867
17.9k
    arr = (int *)gs_alloc_byte_array(ctx->memory, array_size,
868
17.9k
                                     sizeof(int), "array_from_dict_key");
869
17.9k
    if (arr == NULL)
870
0
        return_error(gs_error_VMerror);
871
872
17.9k
    *parray = arr;
873
874
36.9k
    for (i=0;i< array_size;i++) {
875
19.0k
        code = pdfi_array_get_type(ctx, a, (uint64_t)i, PDF_INT, (pdf_obj **)&o);
876
19.0k
        if (code < 0) {
877
58
            gs_free_const_object(ctx->memory, arr, "int_array");
878
58
            *parray = NULL;
879
58
            pdfi_countdown(a);
880
58
            return_error(code);
881
58
        }
882
19.0k
        (*parray)[i] = (int)o->value.i;
883
19.0k
        pdfi_countdown(o);
884
19.0k
    }
885
17.8k
    pdfi_countdown(a);
886
17.8k
    return array_size;
887
17.9k
}
888
889
/* Put into dictionary with key as object -
890
   If the key already exists, we'll only replace it
891
   if "replace" is true.
892
*/
893
int pdfi_dict_put_obj(pdf_context *ctx, pdf_dict *d, pdf_obj *Key, pdf_obj *value, bool replace)
894
47.0M
{
895
47.0M
    int i;
896
47.0M
    pdf_dict_entry *new_list;
897
898
47.0M
    if (pdfi_type_of(d) != PDF_DICT)
899
0
        return_error(gs_error_typecheck);
900
901
47.0M
    if (pdfi_type_of(Key) != PDF_NAME)
902
0
        return_error(gs_error_typecheck);
903
904
    /* First, do we have a Key/value pair already ? */
905
47.0M
    i = pdfi_dict_find_key(ctx, d, (pdf_name *)Key, false);
906
47.0M
    if (i >= 0) {
907
100k
        if (d->list[i].value == value || replace == false)
908
            /* We already have this value stored with this key.... */
909
91.8k
            return 0;
910
8.46k
        pdfi_countdown(d->list[i].value);
911
8.46k
        d->list[i].value = value;
912
8.46k
        pdfi_countup(value);
913
8.46k
        return 0;
914
100k
    }
915
916
46.9M
    d->is_sorted = false;
917
918
    /* Nope, its a new Key */
919
46.9M
    if (d->size > d->entries) {
920
        /* We have a hole, find and use it */
921
19.9G
        for (i=0;i< d->size;i++) {
922
19.9G
            if (d->list[i].key == NULL) {
923
45.3M
                d->list[i].key = Key;
924
45.3M
                pdfi_countup(Key);
925
45.3M
                d->list[i].value = value;
926
45.3M
                pdfi_countup(value);
927
45.3M
                d->entries++;
928
45.3M
                return 0;
929
45.3M
            }
930
19.9G
        }
931
45.3M
    }
932
933
1.51M
    new_list = (pdf_dict_entry *)gs_alloc_bytes(ctx->memory, (size_t)(d->size + 1) * sizeof(pdf_dict_entry), "pdfi_dict_put reallocate dictionary key/values");
934
1.51M
    if (new_list == NULL) {
935
0
        return_error(gs_error_VMerror);
936
0
    }
937
1.51M
    if (d->size > 0)
938
1.35M
        memcpy(new_list, d->list, d->size * sizeof(pdf_dict_entry));
939
940
1.51M
    gs_free_object(ctx->memory, d->list, "pdfi_dict_put key/value reallocation");
941
942
1.51M
    d->list = new_list;
943
944
1.51M
    d->list[d->size].key = Key;
945
1.51M
    d->list[d->size].value = value;
946
1.51M
    d->size++;
947
1.51M
    d->entries++;
948
1.51M
    pdfi_countup(Key);
949
1.51M
    pdfi_countup(value);
950
951
1.51M
    return 0;
952
1.51M
}
953
954
/*
955
 * Be very cautious using this routine; it does not check to see if a key already exists
956
 * in a dictionary!. This is initially at least intended for use by the font code, to build
957
 * a CharStrings dictionary. We do that by adding each glyph individually with a name
958
 * created from a loop counter, so we know there cannot be any duplicates, and the time
959
 * taken to check that each of 64K names was unique was quite significant.
960
 * See bug #705534, the old PDF interpreter (nullpage, 72 dpi) runs this file in ~20 seconds
961
 * pdfi runs it in around 40 seconds. With this change it runs in around 3 seconds. THis is,
962
 * of course, an extreme example.
963
 */
964
int pdfi_dict_put_unchecked(pdf_context *ctx, pdf_dict *d, const char *Key, pdf_obj *value)
965
3.17M
{
966
3.17M
    int i, code = 0;
967
3.17M
    pdf_dict_entry *new_list;
968
3.17M
    pdf_obj *key = NULL;
969
970
3.17M
    code = pdfi_name_alloc(ctx, (byte *)Key, strlen(Key), &key);
971
3.17M
    if (code < 0)
972
0
        return code;
973
3.17M
    pdfi_countup(key);
974
975
3.17M
    if (d->size > d->entries) {
976
3.17M
        int search_start = d->entries < 1 ? 0 : d->entries - 1;
977
3.17M
        do {
978
            /* We have a hole, find and use it */
979
6.35M
            for (i = search_start; i < d->size; i++) {
980
6.35M
                if (d->list[i].key == NULL) {
981
3.17M
                    d->list[i].key = key;
982
3.17M
                    d->list[i].value = value;
983
3.17M
                    pdfi_countup(value);
984
3.17M
                    d->entries++;
985
3.17M
                    return 0;
986
3.17M
                }
987
6.35M
            }
988
0
            if (search_start == 0) {
989
                /* This shouldn't ever happen, but just in case.... */
990
0
                break;
991
0
            }
992
0
            search_start = 0;
993
0
        } while(1);
994
3.17M
    }
995
996
0
    new_list = (pdf_dict_entry *)gs_alloc_bytes(ctx->memory, (size_t)(d->size + 1) * sizeof(pdf_dict_entry), "pdfi_dict_put reallocate dictionary key/values");
997
0
    if (new_list == NULL) {
998
0
        return_error(gs_error_VMerror);
999
0
    }
1000
0
    memcpy(new_list, d->list, d->size * sizeof(pdf_dict_entry));
1001
1002
0
    gs_free_object(ctx->memory, d->list, "pdfi_dict_put key/value reallocation");
1003
1004
0
    d->list = new_list;
1005
1006
0
    d->list[d->size].key = key;
1007
0
    d->list[d->size].value = value;
1008
0
    d->size++;
1009
0
    d->entries++;
1010
0
    pdfi_countup(value);
1011
1012
0
    return 0;
1013
0
}
1014
1015
/* Put into dictionary with key as string */
1016
int pdfi_dict_put(pdf_context *ctx, pdf_dict *d, const char *Key, pdf_obj *value)
1017
2.43M
{
1018
2.43M
    int code;
1019
2.43M
    pdf_obj *key = NULL;
1020
1021
2.43M
    code = pdfi_name_alloc(ctx, (byte *)Key, strlen(Key), &key);
1022
2.43M
    if (code < 0)
1023
0
        return code;
1024
2.43M
    pdfi_countup(key);
1025
1026
2.43M
    code = pdfi_dict_put_obj(ctx, d, key, value, true);
1027
2.43M
    pdfi_countdown(key); /* get rid of extra ref */
1028
2.43M
    return code;
1029
2.43M
}
1030
1031
int pdfi_dict_put_int(pdf_context *ctx, pdf_dict *d, const char *key, int64_t value)
1032
7.72k
{
1033
7.72k
    int code;
1034
7.72k
    pdf_num *obj;
1035
1036
7.72k
    code = pdfi_object_alloc(ctx, PDF_INT, 0, (pdf_obj **)&obj);
1037
7.72k
    if (code < 0)
1038
0
        return code;
1039
7.72k
    obj->value.i = value;
1040
1041
7.72k
    return pdfi_dict_put(ctx, d, key, (pdf_obj *)obj);
1042
7.72k
}
1043
1044
int pdfi_dict_put_bool(pdf_context *ctx, pdf_dict *d, const char *key, bool value)
1045
4.62k
{
1046
4.62k
    pdf_obj *obj = (value ? PDF_TRUE_OBJ : PDF_FALSE_OBJ);
1047
1048
4.62k
    return pdfi_dict_put(ctx, d, key, obj);
1049
4.62k
}
1050
1051
int pdfi_dict_put_name(pdf_context *ctx, pdf_dict *d, const char *key, const char *name)
1052
0
{
1053
0
    int code;
1054
0
    pdf_obj *obj = NULL;
1055
1056
0
    code = pdfi_name_alloc(ctx, (byte *)name, strlen(name), &obj);
1057
0
    if (code < 0)
1058
0
        return code;
1059
0
    pdfi_countup(obj);
1060
1061
0
    code = pdfi_dict_put(ctx, d, key, obj);
1062
0
    pdfi_countdown(obj); /* get rid of extra ref */
1063
0
    return code;
1064
0
}
1065
1066
int pdfi_dict_copy(pdf_context *ctx, pdf_dict *target, pdf_dict *source)
1067
61.0k
{
1068
61.0k
    int i=0, code = 0;
1069
1070
535k
    for (i=0;i< source->entries;i++) {
1071
474k
        code = pdfi_dict_put_obj(ctx, target, source->list[i].key, source->list[i].value, true);
1072
474k
        if (code < 0)
1073
0
            return code;
1074
474k
        target->is_sorted = source->is_sorted;
1075
474k
    }
1076
61.0k
    return 0;
1077
61.0k
}
1078
1079
int pdfi_dict_known(pdf_context *ctx, pdf_dict *d, const char *Key, bool *known)
1080
52.9M
{
1081
52.9M
    int i;
1082
1083
52.9M
    if (pdfi_type_of(d) != PDF_DICT)
1084
5.22k
        return_error(gs_error_typecheck);
1085
1086
52.9M
    *known = false;
1087
52.9M
    i = pdfi_dict_find(ctx, d, Key, true);
1088
52.9M
    if (i >= 0)
1089
17.7M
        *known = true;
1090
1091
52.9M
    return 0;
1092
52.9M
}
1093
1094
int pdfi_dict_known_by_key(pdf_context *ctx, pdf_dict *d, pdf_name *Key, bool *known)
1095
99.9k
{
1096
99.9k
    int i;
1097
1098
99.9k
    if (pdfi_type_of(d) != PDF_DICT)
1099
0
        return_error(gs_error_typecheck);
1100
1101
99.9k
    *known = false;
1102
99.9k
    i = pdfi_dict_find_key(ctx, d, Key, true);
1103
99.9k
    if (i >= 0)
1104
88.9k
        *known = true;
1105
1106
99.9k
    return 0;
1107
99.9k
}
1108
1109
/* Tests if a Key is present in the dictionary, if it is, retrieves the value associated with the
1110
 * key. Returns < 0 for error, 0 if the key is not found > 0 if the key is present, and initialises
1111
 * the value in the arguments. Since this uses pdf_dict_get(), the returned value has its
1112
 * reference count incremented by 1, just like pdfi_dict_get().
1113
 */
1114
int pdfi_dict_knownget(pdf_context *ctx, pdf_dict *d, const char *Key, pdf_obj **o)
1115
9.68M
{
1116
9.68M
    bool known = false;
1117
9.68M
    int code;
1118
1119
9.68M
    code = pdfi_dict_known(ctx, d, Key, &known);
1120
9.68M
    if (code < 0)
1121
583
        return code;
1122
1123
9.68M
    if (known == false)
1124
6.44M
        return 0;
1125
1126
3.23M
    code = pdfi_dict_get(ctx, d, Key, o);
1127
3.23M
    if (code < 0)
1128
56.4k
        return code;
1129
1130
3.18M
    return 1;
1131
3.23M
}
1132
1133
/* Like pdfi_dict_knownget() but allows the user to specify a type for the object that we get.
1134
 * returns < 0 for error (including typecheck if the object is not the requested type)
1135
 * 0 if the key is not found, or > 0 if the key was found and returned.
1136
 */
1137
int pdfi_dict_knownget_type(pdf_context *ctx, pdf_dict *d, const char *Key, pdf_obj_type type, pdf_obj **o)
1138
27.0M
{
1139
27.0M
    bool known = false;
1140
27.0M
    int code;
1141
1142
27.0M
    code = pdfi_dict_known(ctx, d, Key, &known);
1143
27.0M
    if (code < 0)
1144
4.64k
        return code;
1145
1146
27.0M
    if (known == false)
1147
14.4M
        return 0;
1148
1149
12.6M
    code = pdfi_dict_get_type(ctx, d, Key, type, o);
1150
12.6M
    if (code < 0)
1151
326k
        return code;
1152
1153
12.2M
    return 1;
1154
12.6M
}
1155
1156
/* As above but don't store any dereferenced object. Used for Annots when we need the /Parent but
1157
 * storing that back to the annot would create a circulare reference to the page object
1158
 */
1159
int pdfi_dict_knownget_type_no_store_R(pdf_context *ctx, pdf_dict *d, const char *Key, pdf_obj_type type, pdf_obj **o)
1160
163
{
1161
163
    bool known = false;
1162
163
    int code;
1163
1164
163
    code = pdfi_dict_known(ctx, d, Key, &known);
1165
163
    if (code < 0)
1166
0
        return code;
1167
1168
163
    if (known == false)
1169
0
        return 0;
1170
1171
163
    code = pdfi_dict_get_type_no_store_R(ctx, d, Key, type, o);
1172
163
    if (code < 0)
1173
12
        return code;
1174
1175
151
    return 1;
1176
163
}
1177
1178
int pdfi_dict_knownget_bool(pdf_context *ctx, pdf_dict *d, const char *Key, bool *b)
1179
13.4k
{
1180
13.4k
    bool known = false;
1181
13.4k
    int code;
1182
1183
13.4k
    code = pdfi_dict_known(ctx, d, Key, &known);
1184
13.4k
    if (code < 0)
1185
0
        return code;
1186
1187
13.4k
    if (known == false)
1188
7.68k
        return 0;
1189
1190
5.79k
    code = pdfi_dict_get_bool(ctx, d, Key, b);
1191
5.79k
    if (code < 0)
1192
0
        return code;
1193
1194
5.79k
    return 1;
1195
5.79k
}
1196
1197
/* Like pdfi_dict_knownget_type() but retrieves numbers (two possible types)
1198
 */
1199
int pdfi_dict_knownget_number(pdf_context *ctx, pdf_dict *d, const char *Key, double *f)
1200
2.08M
{
1201
2.08M
    bool known = false;
1202
2.08M
    int code;
1203
1204
2.08M
    code = pdfi_dict_known(ctx, d, Key, &known);
1205
2.08M
    if (code < 0)
1206
0
        return code;
1207
1208
2.08M
    if (known == false)
1209
1.97M
        return 0;
1210
1211
111k
    code = pdfi_dict_get_number(ctx, d, Key, f);
1212
111k
    if (code < 0)
1213
4
        return code;
1214
1215
111k
    return 1;
1216
111k
}
1217
1218
int pdfi_dict_next(pdf_context *ctx, pdf_dict *d, pdf_obj **Key, pdf_obj **Value, uint64_t *index)
1219
1.74M
{
1220
1.74M
    int code;
1221
1222
1.74M
    if (pdfi_type_of(d) != PDF_DICT)
1223
0
        return_error(gs_error_typecheck);
1224
1225
1.74M
    while (1) {
1226
1.74M
        if (*index >= d->entries) {
1227
154k
            *Key = NULL;
1228
154k
            *Value= NULL;
1229
154k
            return gs_error_undefined;
1230
154k
        }
1231
1232
        /* If we find NULL keys skip over them. This should never
1233
         * happen as we check the number of entries above, and we
1234
         * compact dictionaries on deletion of key/value pairs.
1235
         * This is a belt and braces check in case creation of the
1236
         * dictionary somehow ends up with NULL keys in the allocated
1237
         * section.
1238
         */
1239
1.59M
        *Key = d->list[*index].key;
1240
1.59M
        if (*Key == NULL) {
1241
0
            (*index)++;
1242
0
            continue;
1243
0
        }
1244
1245
1.59M
        if (pdfi_type_of(d->list[*index].value) == PDF_INDIRECT) {
1246
515k
            pdf_indirect_ref *r = (pdf_indirect_ref *)d->list[*index].value;
1247
515k
            pdf_obj *o;
1248
1249
515k
            code = pdfi_dereference(ctx, r->ref_object_num, r->ref_generation_num, &o);
1250
515k
            if (code < 0) {
1251
223k
                if (code == gs_error_circular_reference) {
1252
                    /* Replace circular references with NULL objects to prevent future
1253
                     * circular dereferencing.
1254
                     */
1255
258
                    pdfi_countdown(d->list[*index].value);
1256
258
                    d->list[*index].value = PDF_NULL_OBJ;
1257
258
                }
1258
223k
                *Key = *Value = NULL;
1259
223k
                return code;
1260
223k
            }
1261
            /* The file Bug690138.pdf has font dictionaries which contain ToUnicode keys where
1262
             * the value is an indirect reference to the same font object. If we replace the
1263
             * indirect reference in the dictionary with the font dictionary it becomes self
1264
             * referencing and never counts down to 0, leading to a memory leak.
1265
             * This is clearly an error, so flag it and don't replace the indirect reference.
1266
             */
1267
291k
            if ((o) < (pdf_obj *)(uintptr_t)(TOKEN__LAST_KEY)) {
1268
                /* "FAST" object, therefore can't be a problem. */
1269
1.42k
                pdfi_countdown(d->list[*index].value);
1270
1.42k
                d->list[*index].value = o;
1271
289k
            } else if (o->object_num == 0 || o->object_num != d->object_num) {
1272
289k
                pdfi_countdown(d->list[*index].value);
1273
289k
                d->list[*index].value = o;
1274
289k
            } else {
1275
                /* Replace self references with NULL objects to prevent future
1276
                 * circular dereferencing.
1277
                 */
1278
4
                pdfi_countdown(d->list[*index].value);
1279
4
                d->list[*index].value = PDF_NULL_OBJ;
1280
4
                *Key = *Value = NULL;
1281
4
                code = pdfi_set_error_stop(ctx, gs_note_error(gs_error_undefinedresult), NULL, E_DICT_SELF_REFERENCE, "pdfi_dict_next", NULL);
1282
4
                return code;
1283
4
            }
1284
291k
            *Value = o;
1285
291k
            pdfi_countup(*Value);
1286
291k
            break;
1287
1.07M
        } else {
1288
1.07M
            *Value = d->list[*index].value;
1289
1.07M
            pdfi_countup(*Value);
1290
1.07M
            break;
1291
1.07M
        }
1292
1.59M
    }
1293
1294
1.37M
    pdfi_countup(*Key);
1295
1.37M
    (*index)++;
1296
1.37M
    return 0;
1297
1.74M
}
1298
1299
int pdfi_dict_next_no_store_R(pdf_context *ctx, pdf_dict *d, pdf_obj **Key, pdf_obj **Value, uint64_t *index)
1300
409k
{
1301
409k
    int code;
1302
1303
409k
    if (pdfi_type_of(d) != PDF_DICT)
1304
0
        return_error(gs_error_typecheck);
1305
1306
409k
    while (1) {
1307
409k
        if (*index >= d->entries) {
1308
0
            *Key = NULL;
1309
0
            *Value= NULL;
1310
0
            return gs_error_undefined;
1311
0
        }
1312
1313
        /* If we find NULL keys skip over them. This should never
1314
         * happen as we check the number of entries above, and we
1315
         * compact dictionaries on deletion of key/value pairs.
1316
         * This is a belt and braces check in case creation of the
1317
         * dictionary somehow ends up with NULL keys in the allocated
1318
         * section.
1319
         */
1320
409k
        *Key = d->list[*index].key;
1321
409k
        if (*Key == NULL) {
1322
0
            (*index)++;
1323
0
            continue;
1324
0
        }
1325
1326
409k
        if (pdfi_type_of(d->list[*index].value) == PDF_INDIRECT) {
1327
403k
            pdf_indirect_ref *r = (pdf_indirect_ref *)d->list[*index].value;
1328
403k
            pdf_obj *o;
1329
1330
403k
            code = pdfi_dereference(ctx, r->ref_object_num, r->ref_generation_num, &o);
1331
403k
            if (code < 0) {
1332
60.6k
                *Key = *Value = NULL;
1333
60.6k
                return code;
1334
60.6k
            }
1335
342k
            *Value = o;
1336
342k
            break;
1337
403k
        } else {
1338
5.79k
            *Value = d->list[*index].value;
1339
5.79k
            pdfi_countup(*Value);
1340
5.79k
            break;
1341
5.79k
        }
1342
409k
    }
1343
1344
348k
    pdfi_countup(*Key);
1345
348k
    (*index)++;
1346
348k
    return 0;
1347
409k
}
1348
1349
int pdfi_dict_first(pdf_context *ctx, pdf_dict *d, pdf_obj **Key, pdf_obj **Value, uint64_t *index)
1350
546k
{
1351
546k
    uint64_t *i = index;
1352
1353
546k
    *i = 0;
1354
546k
    return pdfi_dict_next(ctx, d, Key, Value, index);
1355
546k
}
1356
1357
int pdfi_dict_first_no_store_R(pdf_context *ctx, pdf_dict *d, pdf_obj **Key, pdf_obj **Value, uint64_t *index)
1358
196k
{
1359
196k
    uint64_t *i = index;
1360
1361
196k
    *i = 0;
1362
196k
    return pdfi_dict_next_no_store_R(ctx, d, Key, Value, index);
1363
196k
}
1364
1365
int pdfi_dict_key_next(pdf_context *ctx, pdf_dict *d, pdf_obj **Key, uint64_t *index)
1366
92.6M
{
1367
92.6M
    uint64_t *i = index;
1368
1369
92.6M
    if (pdfi_type_of(d) != PDF_DICT)
1370
0
        return_error(gs_error_typecheck);
1371
1372
92.6M
    while (1) {
1373
92.6M
        if (*i >= d->entries) {
1374
252k
            *Key = NULL;
1375
252k
            return gs_error_undefined;
1376
252k
        }
1377
1378
92.4M
        *Key = d->list[*i].key;
1379
92.4M
        if (*Key == NULL) {
1380
0
            (*i)++;
1381
0
            continue;
1382
0
        }
1383
92.4M
        pdfi_countup(*Key);
1384
92.4M
        (*i)++;
1385
92.4M
        break;
1386
92.4M
    }
1387
92.4M
    return 0;
1388
92.6M
}
1389
1390
int pdfi_dict_key_first(pdf_context *ctx, pdf_dict *d, pdf_obj **Key, uint64_t *index)
1391
602k
{
1392
602k
    uint64_t *i = index;
1393
1394
602k
    *i = 0;
1395
602k
    return pdfi_dict_key_next(ctx, d, Key, index);
1396
602k
}
1397
1398
int pdfi_merge_dicts(pdf_context *ctx, pdf_dict *target, pdf_dict *source)
1399
214k
{
1400
214k
    int i, code;
1401
214k
    bool known = false;
1402
1403
313k
    for (i=0;i< source->entries;i++) {
1404
98.9k
        code = pdfi_dict_known_by_key(ctx, target, (pdf_name *)source->list[i].key, &known);
1405
98.9k
        if (code < 0)
1406
0
            return code;
1407
98.9k
        if (!known) {
1408
10.1k
            code = pdfi_dict_put_obj(ctx, target, source->list[i].key, source->list[i].value, true);
1409
10.1k
            if (code < 0)
1410
0
                return code;
1411
10.1k
        }
1412
98.9k
    }
1413
214k
    target->is_sorted = false;
1414
214k
    return 0;
1415
214k
}
1416
1417
/* Return Length of a stream, or 0 if it's not a stream
1418
 * Caches the Length
1419
 */
1420
int64_t pdfi_stream_length(pdf_context *ctx, pdf_stream *stream)
1421
523k
{
1422
523k
    int64_t Length = 0;
1423
523k
    int code;
1424
1425
523k
    if (pdfi_type_of(stream) != PDF_STREAM)
1426
0
        return 0;
1427
1428
523k
    if (stream->length_valid)
1429
245k
        return stream->Length;
1430
1431
278k
    code = pdfi_dict_get_int(ctx, stream->stream_dict, "Length", &Length);
1432
278k
    if (code < 0)
1433
277k
        Length = 0;
1434
1435
    /* Make sure Length is not negative... */
1436
278k
    if (Length < 0)
1437
0
        Length = 0;
1438
1439
    /* Cache it */
1440
278k
    stream->Length = Length;
1441
278k
    stream->length_valid = true;
1442
1443
278k
    return 0;
1444
523k
}
1445
1446
/* Safely get offset from a stream object.
1447
 * If it's not actually a stream, just return 0.
1448
 */
1449
gs_offset_t pdfi_stream_offset(pdf_context *ctx, pdf_stream *stream)
1450
2.67M
{
1451
2.67M
    if (pdfi_type_of(stream) != PDF_STREAM)
1452
87
        return 0;
1453
2.67M
    return stream->stream_offset;
1454
2.67M
}
1455
1456
pdf_stream *pdfi_stream_parent(pdf_context *ctx, pdf_stream *stream)
1457
934k
{
1458
934k
    if (pdfi_type_of(stream) != PDF_STREAM)
1459
46.1k
        return 0;
1460
888k
    return (pdf_stream *)stream->parent_obj;
1461
934k
}
1462
1463
void pdfi_set_stream_parent(pdf_context *ctx, pdf_stream *stream, pdf_stream *parent)
1464
491k
{
1465
    /* Ordinarily we would increment the reference count of the parent object here,
1466
     * because we are taking a new reference to it. But if we do that we will end up
1467
     * with circular references and will never count down and release the objects.
1468
     * This is because the parent object must have a Resources dictionary which
1469
     * references this stream, when we dereference the stream we store it in the
1470
     * Parent's Resources dictionary. So the parent points to the child, the child
1471
     * points to the parent and we always end up with a refcnt for each of 1. Since we
1472
     * only ever consult parent_obj in an illegal case we deal with this by not
1473
     * incrementing the reference count. To try and avoid any dangling references
1474
     * we clear the parent_obj when we finish executing the stream in
1475
     * pdfi_interpret_content_stream.
1476
     */
1477
491k
    stream->parent_obj = (pdf_obj *)parent;
1478
491k
}
1479
1480
void pdfi_clear_stream_parent(pdf_context *ctx, pdf_stream *stream)
1481
491k
{
1482
491k
    stream->parent_obj = NULL;
1483
491k
}
1484
1485
/* Get the dict from a pdf_obj, returns typecheck if it doesn't have one */
1486
int pdfi_dict_from_obj(pdf_context *ctx, pdf_obj *obj, pdf_dict **dict)
1487
88.5M
{
1488
88.5M
    *dict = NULL;
1489
88.5M
    switch (pdfi_type_of(obj)) {
1490
182k
        case PDF_DICT:
1491
182k
            *dict = (pdf_dict *)obj;
1492
182k
            break;
1493
88.3M
        case PDF_STREAM:
1494
88.3M
            *dict = ((pdf_stream *)obj)->stream_dict;
1495
88.3M
            break;
1496
698
        default:
1497
698
            return_error(gs_error_typecheck);
1498
88.5M
    }
1499
88.5M
    return 0;
1500
88.5M
}