/src/tesseract/src/ccstruct/rejctmap.cpp
Line | Count | Source (jump to first uncovered line) |
1 | | /********************************************************************** |
2 | | * File: rejctmap.cpp (Formerly rejmap.c) |
3 | | * Description: REJ and REJMAP class functions. |
4 | | * Author: Phil Cheatle |
5 | | * |
6 | | * (C) Copyright 1994, Hewlett-Packard Ltd. |
7 | | ** Licensed under the Apache License, Version 2.0 (the "License"); |
8 | | ** you may not use this file except in compliance with the License. |
9 | | ** You may obtain a copy of the License at |
10 | | ** http://www.apache.org/licenses/LICENSE-2.0 |
11 | | ** Unless required by applicable law or agreed to in writing, software |
12 | | ** distributed under the License is distributed on an "AS IS" BASIS, |
13 | | ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
14 | | ** See the License for the specific language governing permissions and |
15 | | ** limitations under the License. |
16 | | * |
17 | | **********************************************************************/ |
18 | | |
19 | | #include "rejctmap.h" |
20 | | |
21 | | #include <memory> |
22 | | |
23 | | #include "params.h" |
24 | | |
25 | | namespace tesseract { |
26 | | |
27 | 0 | void REJ::full_print(FILE *fp) const { |
28 | 0 | fprintf(fp, "R_TESS_FAILURE: %s\n", flag(R_TESS_FAILURE) ? "T" : "F"); |
29 | 0 | fprintf(fp, "R_SMALL_XHT: %s\n", flag(R_SMALL_XHT) ? "T" : "F"); |
30 | 0 | fprintf(fp, "R_EDGE_CHAR: %s\n", flag(R_EDGE_CHAR) ? "T" : "F"); |
31 | 0 | fprintf(fp, "R_1IL_CONFLICT: %s\n", flag(R_1IL_CONFLICT) ? "T" : "F"); |
32 | 0 | fprintf(fp, "R_POSTNN_1IL: %s\n", flag(R_POSTNN_1IL) ? "T" : "F"); |
33 | 0 | fprintf(fp, "R_REJ_CBLOB: %s\n", flag(R_REJ_CBLOB) ? "T" : "F"); |
34 | 0 | fprintf(fp, "R_MM_REJECT: %s\n", flag(R_MM_REJECT) ? "T" : "F"); |
35 | 0 | fprintf(fp, "R_BAD_REPETITION: %s\n", flag(R_BAD_REPETITION) ? "T" : "F"); |
36 | 0 | fprintf(fp, "R_POOR_MATCH: %s\n", flag(R_POOR_MATCH) ? "T" : "F"); |
37 | 0 | fprintf(fp, "R_NOT_TESS_ACCEPTED: %s\n", |
38 | 0 | flag(R_NOT_TESS_ACCEPTED) ? "T" : "F"); |
39 | 0 | fprintf(fp, "R_CONTAINS_BLANKS: %s\n", flag(R_CONTAINS_BLANKS) ? "T" : "F"); |
40 | 0 | fprintf(fp, "R_BAD_PERMUTER: %s\n", flag(R_BAD_PERMUTER) ? "T" : "F"); |
41 | 0 | fprintf(fp, "R_HYPHEN: %s\n", flag(R_HYPHEN) ? "T" : "F"); |
42 | 0 | fprintf(fp, "R_DUBIOUS: %s\n", flag(R_DUBIOUS) ? "T" : "F"); |
43 | 0 | fprintf(fp, "R_NO_ALPHANUMS: %s\n", flag(R_NO_ALPHANUMS) ? "T" : "F"); |
44 | 0 | fprintf(fp, "R_MOSTLY_REJ: %s\n", flag(R_MOSTLY_REJ) ? "T" : "F"); |
45 | 0 | fprintf(fp, "R_XHT_FIXUP: %s\n", flag(R_XHT_FIXUP) ? "T" : "F"); |
46 | 0 | fprintf(fp, "R_BAD_QUALITY: %s\n", flag(R_BAD_QUALITY) ? "T" : "F"); |
47 | 0 | fprintf(fp, "R_DOC_REJ: %s\n", flag(R_DOC_REJ) ? "T" : "F"); |
48 | 0 | fprintf(fp, "R_BLOCK_REJ: %s\n", flag(R_BLOCK_REJ) ? "T" : "F"); |
49 | 0 | fprintf(fp, "R_ROW_REJ: %s\n", flag(R_ROW_REJ) ? "T" : "F"); |
50 | 0 | fprintf(fp, "R_UNLV_REJ: %s\n", flag(R_UNLV_REJ) ? "T" : "F"); |
51 | 0 | fprintf(fp, "R_HYPHEN_ACCEPT: %s\n", flag(R_HYPHEN_ACCEPT) ? "T" : "F"); |
52 | 0 | fprintf(fp, "R_NN_ACCEPT: %s\n", flag(R_NN_ACCEPT) ? "T" : "F"); |
53 | 0 | fprintf(fp, "R_MM_ACCEPT: %s\n", flag(R_MM_ACCEPT) ? "T" : "F"); |
54 | 0 | fprintf(fp, "R_QUALITY_ACCEPT: %s\n", flag(R_QUALITY_ACCEPT) ? "T" : "F"); |
55 | 0 | fprintf(fp, "R_MINIMAL_REJ_ACCEPT: %s\n", |
56 | 0 | flag(R_MINIMAL_REJ_ACCEPT) ? "T" : "F"); |
57 | 0 | } |
58 | | |
59 | 44.4k | REJMAP &REJMAP::operator=(const REJMAP &source) { |
60 | 44.4k | initialise(source.len); |
61 | 240k | for (unsigned i = 0; i < len; i++) { |
62 | 196k | ptr[i] = source.ptr[i]; |
63 | 196k | } |
64 | 44.4k | return *this; |
65 | 44.4k | } |
66 | | |
67 | 127k | void REJMAP::initialise(uint16_t length) { |
68 | 127k | ptr = std::make_unique<REJ[]>(length); |
69 | 127k | len = length; |
70 | 127k | } |
71 | | |
72 | 0 | int16_t REJMAP::accept_count() const { // How many accepted? |
73 | 0 | int16_t count = 0; |
74 | 0 | for (unsigned i = 0; i < len; i++) { |
75 | 0 | if (ptr[i].accepted()) { |
76 | 0 | count++; |
77 | 0 | } |
78 | 0 | } |
79 | 0 | return count; |
80 | 0 | } |
81 | | |
82 | 0 | bool REJMAP::recoverable_rejects() const { // Any non perm rejs? |
83 | 0 | for (unsigned i = 0; i < len; i++) { |
84 | 0 | if (ptr[i].recoverable()) { |
85 | 0 | return true; |
86 | 0 | } |
87 | 0 | } |
88 | 0 | return false; |
89 | 0 | } |
90 | | |
91 | 0 | bool REJMAP::quality_recoverable_rejects() const { // Any potential rejs? |
92 | 0 | for (unsigned i = 0; i < len; i++) { |
93 | 0 | if (ptr[i].accept_if_good_quality()) { |
94 | 0 | return true; |
95 | 0 | } |
96 | 0 | } |
97 | 0 | return false; |
98 | 0 | } |
99 | | |
100 | | void REJMAP::remove_pos( // Cut out an element |
101 | | uint16_t pos // element to remove |
102 | 236 | ) { |
103 | 236 | ASSERT_HOST(pos < len); |
104 | 236 | ASSERT_HOST(len > 0); |
105 | | |
106 | 236 | len--; |
107 | 5.12k | for (; pos < len; pos++) { |
108 | 4.88k | ptr[pos] = ptr[pos + 1]; |
109 | 4.88k | } |
110 | 236 | } |
111 | | |
112 | 0 | void REJMAP::print(FILE *fp) const { |
113 | 0 | fputc('"', fp); |
114 | 0 | for (unsigned i = 0; i < len; i++) { |
115 | 0 | fputc( ptr[i].display_char(), fp); |
116 | 0 | } |
117 | 0 | fputc('"', fp); |
118 | 0 | } |
119 | | |
120 | 0 | void REJMAP::full_print(FILE *fp) const { |
121 | 0 | for (unsigned i = 0; i < len; i++) { |
122 | 0 | ptr[i].full_print(fp); |
123 | 0 | fprintf(fp, "\n"); |
124 | 0 | } |
125 | 0 | } |
126 | | |
127 | 0 | void REJMAP::rej_word_small_xht() { // Reject whole word |
128 | 0 | for (unsigned i = 0; i < len; i++) { |
129 | 0 | ptr[i].setrej_small_xht(); |
130 | 0 | } |
131 | 0 | } |
132 | | |
133 | 4 | void REJMAP::rej_word_tess_failure() { // Reject whole word |
134 | 8 | for (unsigned i = 0; i < len; i++) { |
135 | 4 | ptr[i].setrej_tess_failure(); |
136 | 4 | } |
137 | 4 | } |
138 | | |
139 | 0 | void REJMAP::rej_word_not_tess_accepted() { // Reject whole word |
140 | 0 | for (unsigned i = 0; i < len; i++) { |
141 | 0 | if (ptr[i].accepted()) { |
142 | 0 | ptr[i].setrej_not_tess_accepted(); |
143 | 0 | } |
144 | 0 | } |
145 | 0 | } |
146 | | |
147 | 0 | void REJMAP::rej_word_contains_blanks() { // Reject whole word |
148 | 0 | for (unsigned i = 0; i < len; i++) { |
149 | 0 | if (ptr[i].accepted()) { |
150 | 0 | ptr[i].setrej_contains_blanks(); |
151 | 0 | } |
152 | 0 | } |
153 | 0 | } |
154 | | |
155 | 0 | void REJMAP::rej_word_bad_permuter() { // Reject whole word |
156 | 0 | for (unsigned i = 0; i < len; i++) { |
157 | 0 | if (ptr[i].accepted()) { |
158 | 0 | ptr[i].setrej_bad_permuter(); |
159 | 0 | } |
160 | 0 | } |
161 | 0 | } |
162 | | |
163 | 0 | void REJMAP::rej_word_xht_fixup() { // Reject whole word |
164 | 0 | for (unsigned i = 0; i < len; i++) { |
165 | 0 | if (ptr[i].accepted()) { |
166 | 0 | ptr[i].setrej_xht_fixup(); |
167 | 0 | } |
168 | 0 | } |
169 | 0 | } |
170 | | |
171 | 0 | void REJMAP::rej_word_no_alphanums() { // Reject whole word |
172 | 0 | for (unsigned i = 0; i < len; i++) { |
173 | 0 | if (ptr[i].accepted()) { |
174 | 0 | ptr[i].setrej_no_alphanums(); |
175 | 0 | } |
176 | 0 | } |
177 | 0 | } |
178 | | |
179 | 0 | void REJMAP::rej_word_mostly_rej() { // Reject whole word |
180 | 0 | for (unsigned i = 0; i < len; i++) { |
181 | 0 | if (ptr[i].accepted()) { |
182 | 0 | ptr[i].setrej_mostly_rej(); |
183 | 0 | } |
184 | 0 | } |
185 | 0 | } |
186 | | |
187 | 0 | void REJMAP::rej_word_bad_quality() { // Reject whole word |
188 | 0 | for (unsigned i = 0; i < len; i++) { |
189 | 0 | if (ptr[i].accepted()) { |
190 | 0 | ptr[i].setrej_bad_quality(); |
191 | 0 | } |
192 | 0 | } |
193 | 0 | } |
194 | | |
195 | 0 | void REJMAP::rej_word_doc_rej() { // Reject whole word |
196 | 0 | for (unsigned i = 0; i < len; i++) { |
197 | 0 | if (ptr[i].accepted()) { |
198 | 0 | ptr[i].setrej_doc_rej(); |
199 | 0 | } |
200 | 0 | } |
201 | 0 | } |
202 | | |
203 | 0 | void REJMAP::rej_word_block_rej() { // Reject whole word |
204 | 0 | for (unsigned i = 0; i < len; i++) { |
205 | 0 | if (ptr[i].accepted()) { |
206 | 0 | ptr[i].setrej_block_rej(); |
207 | 0 | } |
208 | 0 | } |
209 | 0 | } |
210 | | |
211 | 0 | void REJMAP::rej_word_row_rej() { // Reject whole word |
212 | 0 | for (unsigned i = 0; i < len; i++) { |
213 | 0 | if (ptr[i].accepted()) { |
214 | 0 | ptr[i].setrej_row_rej(); |
215 | 0 | } |
216 | 0 | } |
217 | 0 | } |
218 | | |
219 | | } // namespace tesseract |