Coverage Report

Created: 2025-11-09 07:04

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/aspell/modules/tokenizer/basic.cpp
Line
Count
Source
1
2
// This file is part of The New Aspell
3
// Copyright (C) 2001 by Kevin Atkinson under the GNU LGPL license
4
// version 2.0 or 2.1.  You should have received a copy of the LGPL
5
// license along with this library if you did not you can find
6
// it at http://www.gnu.org/.
7
8
#include "tokenizer.hpp"
9
#include "convert.hpp"
10
#include "speller.hpp"
11
12
13
namespace acommon {
14
15
  class TokenizerBasic : public Tokenizer
16
  {
17
  public:
18
    bool advance();
19
  };
20
21
43.0k
  bool TokenizerBasic::advance() {
22
43.0k
    word_begin = word_end;
23
43.0k
    begin_pos = end_pos;
24
43.0k
    FilterChar * cur = word_begin;
25
43.0k
    unsigned int cur_pos = begin_pos;
26
43.0k
    word.clear();
27
28
    // skip spaces (non-word characters)
29
2.17M
    while (*cur != 0 &&
30
2.17M
     !(is_word(*cur)
31
2.12M
       || (is_begin(*cur) && is_word(cur[1])))) 
32
2.12M
    {
33
2.12M
      cur_pos += cur->width;
34
2.12M
      ++cur;
35
2.12M
    }
36
37
43.0k
    if (*cur == 0) return false;
38
39
41.9k
    word_begin = cur;
40
41.9k
    begin_pos = cur_pos;
41
42
41.9k
    if (is_begin(*cur) && is_word(cur[1]))
43
242
    {
44
242
      cur_pos += cur->width;
45
242
      ++cur;
46
242
    }
47
48
26.4M
    while (is_word(*cur) || 
49
222k
     (is_middle(*cur) && 
50
180k
      cur > word_begin && is_word(cur[-1]) &&
51
180k
      is_word(cur[1]) )) 
52
26.3M
    {
53
26.3M
      word.append(*cur);
54
26.3M
      cur_pos += cur->width;
55
26.3M
      ++cur;
56
26.3M
    }
57
58
41.9k
    if (is_end(*cur))
59
1.06k
    {
60
1.06k
      word.append(*cur);
61
1.06k
      cur_pos += cur->width;
62
1.06k
      ++cur;
63
1.06k
    }
64
65
41.9k
    word.append('\0');
66
41.9k
    word_end = cur;
67
41.9k
    end_pos = cur_pos;
68
69
41.9k
    return true;
70
43.0k
  }
71
#undef increment__
72
73
  PosibErr<Tokenizer *> new_tokenizer(Speller * speller)
74
1.12k
  {
75
1.12k
    Tokenizer * tok = new TokenizerBasic();
76
1.12k
    speller->setup_tokenizer(tok);
77
1.12k
    return tok;
78
1.12k
  }
79
80
}