Coverage Report

Created: 2026-04-28 07:00

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/gnupg/common/mbox-util.c
Line
Count
Source
1
/* mbox-util.c - Mail address helper functions
2
 * Copyright (C) 1998-2010 Free Software Foundation, Inc.
3
 * Copyright (C) 1998-2015 Werner Koch
4
 *
5
 * This file is part of GnuPG.
6
 *
7
 * This file is free software; you can redistribute it and/or modify
8
 * it under the terms of the GNU Lesser General Public License as
9
 * published by the Free Software Foundation; either version 2.1 of
10
 * the License, or (at your option) any later version.
11
 *
12
 * This file is distributed in the hope that it will be useful,
13
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15
 * GNU General Public License for more details.
16
 *
17
 * You should have received a copy of the GNU Lesser General Public License
18
 * along with this program; if not, see <https://www.gnu.org/licenses/>.
19
 */
20
21
/* NB: GPGME uses the same code to reflect our idea on how to extract
22
 * a mail address from a user id.
23
 */
24
25
#include <config.h>
26
#include <stdio.h>
27
#include <stdlib.h>
28
#include <string.h>
29
#include <unistd.h>
30
#include <errno.h>
31
32
#include "util.h"
33
#include "mbox-util.h"
34
35
36
static int
37
string_count_chr (const char *string, int c)
38
2.80k
{
39
2.80k
  int count;
40
41
25.9k
  for (count=0; *string; string++ )
42
23.1k
    if ( *string == c )
43
3.04k
      count++;
44
2.80k
  return count;
45
2.80k
}
46
47
static int
48
mem_count_chr (const void *buffer, int c, size_t length)
49
13.0k
{
50
13.0k
  const char *s = buffer;
51
13.0k
  int count;
52
53
43.3k
  for (count=0; length; length--, s++)
54
30.2k
    if (*s == c)
55
5.72k
      count++;
56
13.0k
  return count;
57
13.0k
}
58
59
60
static int
61
string_has_ctrl_or_space (const char *string)
62
1.50k
{
63
15.5k
  for (; *string; string++ )
64
14.2k
    if (!(*string & 0x80) && *string <= 0x20)
65
216
      return 1;
66
1.29k
  return 0;
67
1.50k
}
68
69
70
/* Return true if STRING has two consecutive '.' after an '@'
71
   sign.  */
72
static int
73
has_dotdot_after_at (const char *string)
74
1.29k
{
75
1.29k
  string = strchr (string, '@');
76
1.29k
  if (!string)
77
0
    return 0; /* No at-sign.  */
78
1.29k
  string++;
79
1.29k
  return !!strstr (string, "..");
80
1.29k
}
81
82
83
/* Check whether BUFFER has characters not valid in an RFC-822
84
   address.  LENGTH gives the length of BUFFER.
85
86
   To cope with OpenPGP we ignore non-ascii characters so that for
87
   example umlauts are legal in an email address.  An OpenPGP user ID
88
   must be utf-8 encoded but there is no strict requirement for
89
   RFC-822.  Thus to avoid IDNA encoding we put the address verbatim
90
   as utf-8 into the user ID under the assumption that mail programs
91
   handle IDNA at a lower level and take OpenPGP user IDs as utf-8.
92
   Note that we can't do an utf-8 encoding checking here because in
93
   keygen.c this function is called with the native encoding and
94
   native to utf-8 encoding is only done later.  */
95
int
96
has_invalid_email_chars (const void *buffer, size_t length)
97
16.3k
{
98
16.3k
  const unsigned char *s = buffer;
99
16.3k
  int at_seen=0;
100
16.3k
  const char *valid_chars=
101
16.3k
    "01234567890_-.abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ";
102
103
51.0k
  for ( ; length && *s; length--, s++ )
104
37.9k
    {
105
37.9k
      if ((*s & 0x80))
106
12.1k
        continue; /* We only care about ASCII.  */
107
25.7k
      if (*s == '@')
108
7.63k
        at_seen=1;
109
18.1k
      else if (!at_seen && !(strchr (valid_chars, *s)
110
4.53k
                             || strchr ("!#$%&'*+/=?^`{|}~", *s)))
111
1.32k
        return 1;
112
16.8k
      else if (at_seen && !strchr (valid_chars, *s))
113
1.91k
        return 1;
114
25.7k
    }
115
13.0k
  return 0;
116
16.3k
}
117
118
119
/* Same as is_valid_mailbox (see below) but operates on non-nul
120
   terminated buffer.  */
121
int
122
is_valid_mailbox_mem (const void *name_arg, size_t namelen)
123
16.3k
{
124
16.3k
  const char *name = name_arg;
125
126
16.3k
  return !( !name
127
16.3k
            || !namelen
128
16.3k
            || has_invalid_email_chars (name, namelen)
129
13.0k
            || mem_count_chr (name, '@', namelen) != 1
130
3.92k
            || *name == '@'
131
3.33k
            || name[namelen-1] == '@'
132
2.86k
            || name[namelen-1] == '.'
133
1.62k
            || gnupg_memstr (name, namelen, ".."));
134
16.3k
}
135
136
137
/* Check whether NAME represents a valid mailbox according to
138
   RFC822. Returns true if so. */
139
int
140
is_valid_mailbox (const char *name)
141
16.3k
{
142
16.3k
  return name? is_valid_mailbox_mem (name, strlen (name)) : 0;
143
16.3k
}
144
145
146
/* Return the mailbox (local-part@domain) form a standard user id.
147
 * All plain ASCII characters in the result are converted to
148
 * lowercase.  If SUBADDRESS is 1, '+' denoted sub-addresses are not
149
 * included in the result.  Caller must free the result.  Returns NULL
150
 * if no valid mailbox was found (or we are out of memory). */
151
char *
152
mailbox_from_userid (const char *userid, int subaddress)
153
19.8k
{
154
19.8k
  const char *s, *s_end;
155
19.8k
  size_t len;
156
19.8k
  char *result = NULL;
157
158
19.8k
  s = strchr (userid, '<');
159
19.8k
  if (s)
160
3.51k
    {
161
      /* Seems to be a standard user id.  */
162
3.51k
      s++;
163
3.51k
      s_end = strchr (s, '>');
164
3.51k
      if (s_end && s_end > s)
165
2.80k
        {
166
2.80k
          len = s_end - s;
167
2.80k
          result = xtrymalloc (len + 1);
168
2.80k
          if (!result)
169
0
            return NULL; /* Ooops - out of core.  */
170
2.80k
          strncpy (result, s, len);
171
2.80k
          result[len] = 0;
172
          /* Apply some basic checks on the address.  We do not use
173
             is_valid_mailbox because those checks are too strict.  */
174
2.80k
          if (string_count_chr (result, '@') != 1  /* Need exactly one '@.  */
175
2.51k
              || *result == '@'           /* local-part missing.  */
176
2.38k
              || result[len-1] == '@'     /* domain missing.  */
177
2.23k
              || result[len-1] == '.'     /* ends with a dot.  */
178
1.50k
              || string_has_ctrl_or_space (result)
179
1.29k
              || has_dotdot_after_at (result))
180
1.84k
            {
181
1.84k
              xfree (result);
182
1.84k
              result = NULL;
183
1.84k
              errno = EINVAL;
184
1.84k
            }
185
2.80k
        }
186
715
      else
187
3.51k
        errno = EINVAL;
188
3.51k
    }
189
16.3k
  else if (is_valid_mailbox (userid))
190
1.25k
    {
191
      /* The entire user id is a mailbox.  Return that one.  Note that
192
         this fallback method has some restrictions on the valid
193
         syntax of the mailbox.  However, those who want weird
194
         addresses should know about it and use the regular <...>
195
         syntax.  */
196
1.25k
      result = xtrystrdup (userid);
197
1.25k
    }
198
15.0k
  else
199
16.3k
    errno = EINVAL;
200
201
19.8k
  if (result && subaddress == 1)
202
0
    {
203
0
      char *atsign, *plus;
204
205
0
      if ((atsign = strchr (result, '@')))
206
0
        {
207
          /* We consider a subaddress only if there is a single '+'
208
           * in the local part and the '+' is not the first or last
209
           * character.  */
210
0
          *atsign = 0;
211
0
          if ((plus = strchr (result, '+'))
212
0
              && !strchr (plus+1, '+')
213
0
              && result != plus
214
0
              && plus[1] )
215
0
            {
216
0
              *atsign = '@';
217
0
              memmove (plus, atsign, strlen (atsign)+1);
218
0
            }
219
0
          else
220
0
            *atsign = '@';
221
0
        }
222
0
    }
223
224
19.8k
  return result? ascii_strlwr (result): NULL;
225
19.8k
}
226
227
228
/* Check whether UID is a valid standard user id of the form
229
     "Heinrich Heine <heinrichh@duesseldorf.de>"
230
   and return true if this is the case. */
231
int
232
is_valid_user_id (const char *uid)
233
0
{
234
0
  if (!uid || !*uid)
235
0
    return 0;
236
237
0
  return 1;
238
0
}
239
240
241
/* Returns true if STRING is a valid domain name according to the LDH
242
 * rule. */
243
int
244
is_valid_domain_name (const char *string)
245
0
{
246
0
  static char const ldh_chars[] =
247
0
    "01234567890abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ-";
248
0
  const char *s;
249
250
  /* Note that we do not check the length limit of a label or the
251
   * entire name */
252
253
0
  for (s=string; *s; s++)
254
0
    if (*s == '.')
255
0
      {
256
0
        if (string == s)
257
0
          return 0; /* Dot at the start of the string.  */
258
                    /* (may also be at the end like in ".") */
259
0
        if (s[1] == '.')
260
0
          return 0; /* No - double dot.  */
261
0
      }
262
0
    else if (!strchr (ldh_chars, *s))
263
0
      return 0;
264
0
    else if (*s == '-')
265
0
      {
266
0
        if (string == s)
267
0
          return 0;  /* Leading hyphen.  */
268
0
        if (s[-1] == '.')
269
0
          return 0;  /* Hyphen at begin of a label.  */
270
0
        if (s[1] == '.')
271
0
          return 0;  /* Hyphen at start of a label.  */
272
0
        if (!s[1])
273
0
          return 0;  /* Trailing hyphen.  */
274
0
      }
275
276
0
  return !!*string;
277
0
}