Coverage Report

Created: 2024-11-25 06:29

/src/nettle/memxor.c
Line
Count
Source
1
/* memxor.c
2
3
   Copyright (C) 2010, 2014 Niels Möller
4
5
   This file is part of GNU Nettle.
6
7
   GNU Nettle is free software: you can redistribute it and/or
8
   modify it under the terms of either:
9
10
     * the GNU Lesser General Public License as published by the Free
11
       Software Foundation; either version 3 of the License, or (at your
12
       option) any later version.
13
14
   or
15
16
     * the GNU General Public License as published by the Free
17
       Software Foundation; either version 2 of the License, or (at your
18
       option) any later version.
19
20
   or both in parallel, as here.
21
22
   GNU Nettle is distributed in the hope that it will be useful,
23
   but WITHOUT ANY WARRANTY; without even the implied warranty of
24
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
25
   General Public License for more details.
26
27
   You should have received copies of the GNU General Public License and
28
   the GNU Lesser General Public License along with this program.  If
29
   not, see http://www.gnu.org/licenses/.
30
*/
31
32
/* Implementation inspired by memcmp in glibc, contributed to the FSF
33
   by Torbjorn Granlund.
34
 */
35
36
#if HAVE_CONFIG_H
37
# include "config.h"
38
#endif
39
40
#include <assert.h>
41
#include <limits.h>
42
43
#include "memxor.h"
44
#include "memxor-internal.h"
45
46
207k
#define WORD_T_THRESH 16
47
48
/* XOR word-aligned areas. n is the number of words, not bytes. */
49
static void
50
memxor_common_alignment (word_t *dst, const word_t *src, size_t n)
51
90.7k
{
52
  /* FIXME: Require n > 0? */
53
  /* FIXME: Unroll four times, like memcmp? Probably not worth the
54
     effort. */
55
56
90.7k
  if (n & 1)
57
112
    {
58
112
      n--;
59
112
      dst[n] ^= src[n];
60
112
    }
61
290k
  while (n >= 2)
62
199k
    {
63
199k
      n -= 2;
64
199k
      dst[n+1] ^= src[n+1];
65
199k
      dst[n] ^= src[n];
66
199k
    }
67
90.7k
}
68
69
/* XOR *un-aligned* src-area onto aligned dst area. n is number of
70
   words, not bytes. Assumes we can read complete words at the start
71
   and end of the src operand. */
72
static void
73
memxor_different_alignment (word_t *dst, const unsigned char *src, size_t n)
74
83.6k
{
75
83.6k
  int shl, shr;
76
83.6k
  const word_t *src_word;
77
83.6k
  unsigned offset = ALIGN_OFFSET (src);
78
83.6k
  word_t s0, s1;
79
80
83.6k
  assert (n > 0);
81
83.6k
  shl = CHAR_BIT * offset;
82
83.6k
  shr = CHAR_BIT * (sizeof(word_t) - offset);
83
84
83.6k
  src_word = (const word_t *) ((uintptr_t) src & -sizeof(word_t));
85
86
  /* Read top offset bytes, in native byte order. */
87
83.6k
  READ_PARTIAL (s0, (unsigned char *) &src_word[n], offset);
88
#ifdef WORDS_BIGENDIAN
89
  s0 <<= shr; /* FIXME: Eliminate this shift? */
90
#endif
91
92
  /* Do n-1 regular iterations */
93
83.6k
  if (n & 1)
94
9.02k
    s1 = s0;
95
74.6k
  else
96
74.6k
    {
97
74.6k
      n--;
98
74.6k
      s1 = src_word[n];
99
74.6k
      dst[n] ^= MERGE (s1, shl, s0, shr);
100
74.6k
    }
101
102
83.6k
  assert (n & 1);
103
252k
  while (n > 2)
104
168k
    {
105
168k
      n -= 2;
106
168k
      s0 = src_word[n+1];
107
168k
      dst[n+1] ^= MERGE(s0, shl, s1, shr);
108
168k
      s1 = src_word[n]; /* FIXME: Overread on last iteration */
109
168k
      dst[n] ^= MERGE(s1, shl, s0, shr);
110
168k
    }
111
83.6k
  assert (n == 1);
112
  /* Read low wordsize - offset bytes */
113
83.6k
  READ_PARTIAL (s0, src, sizeof(word_t) - offset);
114
83.6k
#ifndef WORDS_BIGENDIAN
115
83.6k
  s0 <<= shl; /* FIXME: eliminate shift? */
116
83.6k
#endif /* !WORDS_BIGENDIAN */
117
118
83.6k
  dst[0] ^= MERGE(s0, shl, s1, shr);
119
83.6k
}
120
121
/* Performance, Intel SU1400 (x86_64): 0.25 cycles/byte aligned, 0.45
122
   cycles/byte unaligned. */
123
124
/* XOR LEN bytes starting at SRCADDR onto DESTADDR. Result undefined
125
   if the source overlaps with the destination. Return DESTADDR. */
126
void *
127
memxor(void *dst_in, const void *src_in, size_t n)
128
207k
{
129
207k
  unsigned char *dst = dst_in;
130
207k
  const unsigned char *src = src_in;
131
132
207k
  if (n >= WORD_T_THRESH)
133
174k
    {
134
174k
      unsigned i;
135
174k
      unsigned offset;
136
174k
      size_t nwords;
137
      /* There are at least some bytes to compare.  No need to test
138
   for N == 0 in this alignment loop.  */
139
176k
      for (i = ALIGN_OFFSET(dst + n); i > 0; i--)
140
2.25k
  {
141
2.25k
    n--;
142
2.25k
    dst[n] ^= src[n];
143
2.25k
  }
144
174k
      offset = ALIGN_OFFSET(src + n);
145
174k
      nwords = n / sizeof (word_t);
146
174k
      n %= sizeof (word_t);
147
148
174k
      if (offset)
149
83.6k
  memxor_different_alignment ((word_t *) (dst+n), src+n, nwords);
150
90.7k
      else
151
90.7k
  memxor_common_alignment ((word_t *) (dst+n),
152
90.7k
         (const word_t *) (src+n), nwords);
153
174k
    }
154
431k
  while (n > 0)
155
223k
    {
156
223k
      n--;
157
223k
      dst[n] ^= src[n];
158
223k
    }
159
160
207k
  return dst;
161
207k
}