Coverage Report

Created: 2025-06-13 07:02

/src/tesseract/src/ccstruct/rejctmap.cpp
Line
Count
Source (jump to first uncovered line)
1
/**********************************************************************
2
 * File:        rejctmap.cpp  (Formerly rejmap.c)
3
 * Description: REJ and REJMAP class functions.
4
 * Author:      Phil Cheatle
5
 *
6
 * (C) Copyright 1994, Hewlett-Packard Ltd.
7
 ** Licensed under the Apache License, Version 2.0 (the "License");
8
 ** you may not use this file except in compliance with the License.
9
 ** You may obtain a copy of the License at
10
 ** http://www.apache.org/licenses/LICENSE-2.0
11
 ** Unless required by applicable law or agreed to in writing, software
12
 ** distributed under the License is distributed on an "AS IS" BASIS,
13
 ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
 ** See the License for the specific language governing permissions and
15
 ** limitations under the License.
16
 *
17
 **********************************************************************/
18
19
#include "rejctmap.h"
20
21
#include <memory>
22
23
#include "params.h"
24
25
namespace tesseract {
26
27
0
void REJ::full_print(FILE *fp) const {
28
0
  fprintf(fp, "R_TESS_FAILURE: %s\n", flag(R_TESS_FAILURE) ? "T" : "F");
29
0
  fprintf(fp, "R_SMALL_XHT: %s\n", flag(R_SMALL_XHT) ? "T" : "F");
30
0
  fprintf(fp, "R_EDGE_CHAR: %s\n", flag(R_EDGE_CHAR) ? "T" : "F");
31
0
  fprintf(fp, "R_1IL_CONFLICT: %s\n", flag(R_1IL_CONFLICT) ? "T" : "F");
32
0
  fprintf(fp, "R_POSTNN_1IL: %s\n", flag(R_POSTNN_1IL) ? "T" : "F");
33
0
  fprintf(fp, "R_REJ_CBLOB: %s\n", flag(R_REJ_CBLOB) ? "T" : "F");
34
0
  fprintf(fp, "R_MM_REJECT: %s\n", flag(R_MM_REJECT) ? "T" : "F");
35
0
  fprintf(fp, "R_BAD_REPETITION: %s\n", flag(R_BAD_REPETITION) ? "T" : "F");
36
0
  fprintf(fp, "R_POOR_MATCH: %s\n", flag(R_POOR_MATCH) ? "T" : "F");
37
0
  fprintf(fp, "R_NOT_TESS_ACCEPTED: %s\n",
38
0
          flag(R_NOT_TESS_ACCEPTED) ? "T" : "F");
39
0
  fprintf(fp, "R_CONTAINS_BLANKS: %s\n", flag(R_CONTAINS_BLANKS) ? "T" : "F");
40
0
  fprintf(fp, "R_BAD_PERMUTER: %s\n", flag(R_BAD_PERMUTER) ? "T" : "F");
41
0
  fprintf(fp, "R_HYPHEN: %s\n", flag(R_HYPHEN) ? "T" : "F");
42
0
  fprintf(fp, "R_DUBIOUS: %s\n", flag(R_DUBIOUS) ? "T" : "F");
43
0
  fprintf(fp, "R_NO_ALPHANUMS: %s\n", flag(R_NO_ALPHANUMS) ? "T" : "F");
44
0
  fprintf(fp, "R_MOSTLY_REJ: %s\n", flag(R_MOSTLY_REJ) ? "T" : "F");
45
0
  fprintf(fp, "R_XHT_FIXUP: %s\n", flag(R_XHT_FIXUP) ? "T" : "F");
46
0
  fprintf(fp, "R_BAD_QUALITY: %s\n", flag(R_BAD_QUALITY) ? "T" : "F");
47
0
  fprintf(fp, "R_DOC_REJ: %s\n", flag(R_DOC_REJ) ? "T" : "F");
48
0
  fprintf(fp, "R_BLOCK_REJ: %s\n", flag(R_BLOCK_REJ) ? "T" : "F");
49
0
  fprintf(fp, "R_ROW_REJ: %s\n", flag(R_ROW_REJ) ? "T" : "F");
50
0
  fprintf(fp, "R_UNLV_REJ: %s\n", flag(R_UNLV_REJ) ? "T" : "F");
51
0
  fprintf(fp, "R_HYPHEN_ACCEPT: %s\n", flag(R_HYPHEN_ACCEPT) ? "T" : "F");
52
0
  fprintf(fp, "R_NN_ACCEPT: %s\n", flag(R_NN_ACCEPT) ? "T" : "F");
53
0
  fprintf(fp, "R_MM_ACCEPT: %s\n", flag(R_MM_ACCEPT) ? "T" : "F");
54
0
  fprintf(fp, "R_QUALITY_ACCEPT: %s\n", flag(R_QUALITY_ACCEPT) ? "T" : "F");
55
0
  fprintf(fp, "R_MINIMAL_REJ_ACCEPT: %s\n",
56
0
          flag(R_MINIMAL_REJ_ACCEPT) ? "T" : "F");
57
0
}
58
59
44.4k
// Copy assignment: make this map an element-by-element copy of source.
//
// The map is re-allocated to source.len entries via initialise() and each
// entry is then copied across. Returns *this so assignments can be chained.
REJMAP &REJMAP::operator=(const REJMAP &source) {
  // Self-assignment must be a no-op: initialise() replaces ptr with a freshly
  // allocated array, so without this guard `map = map` would copy from the
  // new array and the previous contents would be lost.
  if (this != &source) {
    initialise(source.len);
    for (unsigned i = 0; i < len; i++) {
      ptr[i] = source.ptr[i];
    }
  }
  return *this;
}
66
67
127k
void REJMAP::initialise(uint16_t length) {
68
127k
  ptr = std::make_unique<REJ[]>(length);
69
127k
  len = length;
70
127k
}
71
72
0
int16_t REJMAP::accept_count() const { // How many accepted?
73
0
  int16_t count = 0;
74
0
  for (unsigned i = 0; i < len; i++) {
75
0
    if (ptr[i].accepted()) {
76
0
      count++;
77
0
    }
78
0
  }
79
0
  return count;
80
0
}
81
82
0
bool REJMAP::recoverable_rejects() const { // Any non perm rejs?
83
0
  for (unsigned i = 0; i < len; i++) {
84
0
    if (ptr[i].recoverable()) {
85
0
      return true;
86
0
    }
87
0
  }
88
0
  return false;
89
0
}
90
91
0
bool REJMAP::quality_recoverable_rejects() const { // Any potential rejs?
92
0
  for (unsigned i = 0; i < len; i++) {
93
0
    if (ptr[i].accept_if_good_quality()) {
94
0
      return true;
95
0
    }
96
0
  }
97
0
  return false;
98
0
}
99
100
void REJMAP::remove_pos( // Cut out an element
101
    uint16_t pos         // element to remove
102
236
) {
103
236
  ASSERT_HOST(pos < len);
104
236
  ASSERT_HOST(len > 0);
105
106
236
  len--;
107
5.12k
  for (; pos < len; pos++) {
108
4.88k
    ptr[pos] = ptr[pos + 1];
109
4.88k
  }
110
236
}
111
112
0
void REJMAP::print(FILE *fp) const {
113
0
  fputc('"', fp);
114
0
  for (unsigned i = 0; i < len; i++) {
115
0
    fputc( ptr[i].display_char(), fp);
116
0
  }
117
0
  fputc('"', fp);
118
0
}
119
120
0
void REJMAP::full_print(FILE *fp) const {
121
0
  for (unsigned i = 0; i < len; i++) {
122
0
    ptr[i].full_print(fp);
123
0
    fprintf(fp, "\n");
124
0
  }
125
0
}
126
127
0
void REJMAP::rej_word_small_xht() { // Reject whole word
128
0
  for (unsigned i = 0; i < len; i++) {
129
0
    ptr[i].setrej_small_xht();
130
0
  }
131
0
}
132
133
4
void REJMAP::rej_word_tess_failure() { // Reject whole word
134
8
  for (unsigned i = 0; i < len; i++) {
135
4
    ptr[i].setrej_tess_failure();
136
4
  }
137
4
}
138
139
0
void REJMAP::rej_word_not_tess_accepted() { // Reject whole word
140
0
  for (unsigned i = 0; i < len; i++) {
141
0
    if (ptr[i].accepted()) {
142
0
      ptr[i].setrej_not_tess_accepted();
143
0
    }
144
0
  }
145
0
}
146
147
0
void REJMAP::rej_word_contains_blanks() { // Reject whole word
148
0
  for (unsigned i = 0; i < len; i++) {
149
0
    if (ptr[i].accepted()) {
150
0
      ptr[i].setrej_contains_blanks();
151
0
    }
152
0
  }
153
0
}
154
155
0
void REJMAP::rej_word_bad_permuter() { // Reject whole word
156
0
  for (unsigned i = 0; i < len; i++) {
157
0
    if (ptr[i].accepted()) {
158
0
      ptr[i].setrej_bad_permuter();
159
0
    }
160
0
  }
161
0
}
162
163
0
void REJMAP::rej_word_xht_fixup() { // Reject whole word
164
0
  for (unsigned i = 0; i < len; i++) {
165
0
    if (ptr[i].accepted()) {
166
0
      ptr[i].setrej_xht_fixup();
167
0
    }
168
0
  }
169
0
}
170
171
0
void REJMAP::rej_word_no_alphanums() { // Reject whole word
172
0
  for (unsigned i = 0; i < len; i++) {
173
0
    if (ptr[i].accepted()) {
174
0
      ptr[i].setrej_no_alphanums();
175
0
    }
176
0
  }
177
0
}
178
179
0
void REJMAP::rej_word_mostly_rej() { // Reject whole word
180
0
  for (unsigned i = 0; i < len; i++) {
181
0
    if (ptr[i].accepted()) {
182
0
      ptr[i].setrej_mostly_rej();
183
0
    }
184
0
  }
185
0
}
186
187
0
void REJMAP::rej_word_bad_quality() { // Reject whole word
188
0
  for (unsigned i = 0; i < len; i++) {
189
0
    if (ptr[i].accepted()) {
190
0
      ptr[i].setrej_bad_quality();
191
0
    }
192
0
  }
193
0
}
194
195
0
void REJMAP::rej_word_doc_rej() { // Reject whole word
196
0
  for (unsigned i = 0; i < len; i++) {
197
0
    if (ptr[i].accepted()) {
198
0
      ptr[i].setrej_doc_rej();
199
0
    }
200
0
  }
201
0
}
202
203
0
void REJMAP::rej_word_block_rej() { // Reject whole word
204
0
  for (unsigned i = 0; i < len; i++) {
205
0
    if (ptr[i].accepted()) {
206
0
      ptr[i].setrej_block_rej();
207
0
    }
208
0
  }
209
0
}
210
211
0
void REJMAP::rej_word_row_rej() { // Reject whole word
212
0
  for (unsigned i = 0; i < len; i++) {
213
0
    if (ptr[i].accepted()) {
214
0
      ptr[i].setrej_row_rej();
215
0
    }
216
0
  }
217
0
}
218
219
} // namespace tesseract