/src/haproxy/src/dns_ring.c

Source
/*
 * Ring buffer management
 * This is a fork of ring.c for DNS usage.
 *
 * Copyright (C) 2000-2019 Willy Tarreau - w@1wt.eu
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation, version 2.1
 * exclusively.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 */

#include <stdlib.h>
#include <haproxy/api.h>
#include <haproxy/applet.h>
#include <haproxy/buf.h>
#include <haproxy/cli.h>
#include <haproxy/dns_ring.h>
#include <haproxy/sc_strm.h>
#include <haproxy/stconn.h>
#include <haproxy/thread.h>

/* Initialize a pre-allocated ring with the buffer area
 * of size */
void dns_ring_init(struct dns_ring *ring, void *area, size_t size)
{
  HA_RWLOCK_INIT(&ring->lock);
  MT_LIST_INIT(&ring->waiters);
  ring->readers_count = 0;
  ring->buf = b_make(area, size, 0, 0);
  /* write the initial RC byte */
  b_putchr(&ring->buf, 0);
}

/* Creates and returns a ring buffer of size <size> bytes. Returns NULL on
 * allocation failure.
 */
struct dns_ring *dns_ring_new(size_t size)
{
  struct dns_ring *ring = NULL;
  void *area = NULL;

  if (size < 2)
    goto fail;

  ring = malloc(sizeof(*ring));
  if (!ring)
    goto fail;

  area = malloc(size);
  if (!area)
    goto fail;

  dns_ring_init(ring, area, size);
  return ring;
 fail:
  free(area);
  free(ring);
  return NULL;
}

/* destroys and frees ring <ring> */
void dns_ring_free(struct dns_ring *ring)
{
  if (!ring)
    return;

  free(ring->buf.area);
  free(ring);
}

/* Tries to send <npfx> parts from <prefix> followed by <nmsg> parts from <msg>
 * to ring <ring>. The message is sent atomically. It may be truncated to
 * <maxlen> bytes if <maxlen> is non-null. There is no distinction between the
 * two lists, it's just a convenience to help the caller prepend some prefixes
 * when necessary. It takes the ring's write lock to make sure no other thread
 * will touch the buffer during the update. Returns the number of bytes sent,
 * or <=0 on failure.
 */
ssize_t dns_ring_write(struct dns_ring *ring, size_t maxlen, const struct ist pfx[], size_t npfx, const struct ist msg[], size_t nmsg)
{
  struct buffer *buf = &ring->buf;
  struct appctx *appctx;
  size_t totlen = 0;
  size_t lenlen;
  uint64_t dellen;
  int dellenlen;
  struct mt_list back;
  ssize_t sent = 0;
  int i;

  /* we have to find some room to add our message (the buffer is
   * never empty and at least contains the previous counter) and
   * to update both the buffer contents and heads at the same
   * time (it's doable using atomic ops but not worth the
   * trouble, let's just lock). For this we first need to know
   * the total message's length. We cannot measure it while
   * copying due to the varint encoding of the length.
   */
  for (i = 0; i < npfx; i++)
    totlen += pfx[i].len;
  for (i = 0; i < nmsg; i++)
    totlen += msg[i].len;

  if (totlen > maxlen)
    totlen = maxlen;

  lenlen = varint_bytes(totlen);

  HA_RWLOCK_WRLOCK(RING_LOCK, &ring->lock);
  if (lenlen + totlen + 1 + 1 > b_size(buf))
    goto done_buf;

  while (b_room(buf) < lenlen + totlen + 1) {
    /* we need to delete the oldest message (from the end),
     * and we have to stop if there's a reader stuck there.
     * Unless there's corruption in the buffer it's guaranteed
     * that we have enough data to find 1 counter byte, a
     * varint-encoded length (1 byte min) and the message
     * payload (0 bytes min).
     */
    if (*b_head(buf))
      goto done_buf;
    dellenlen = b_peek_varint(buf, 1, &dellen);
    if (!dellenlen)
      goto done_buf;
    BUG_ON(b_data(buf) < 1 + dellenlen + dellen);

    b_del(buf, 1 + dellenlen + dellen);
  }

  /* OK now we do have room */
  __b_put_varint(buf, totlen);

  totlen = 0;
  for (i = 0; i < npfx; i++) {
    size_t len = pfx[i].len;

    if (len + totlen > maxlen)
      len = maxlen - totlen;
    if (len)
      __b_putblk(buf, pfx[i].ptr, len);
    totlen += len;
  }

  for (i = 0; i < nmsg; i++) {
    size_t len = msg[i].len;

    if (len + totlen > maxlen)
      len = maxlen - totlen;
    if (len)
      __b_putblk(buf, msg[i].ptr, len);
    totlen += len;
  }

  *b_tail(buf) = 0; buf->data++; // new read counter
  sent = lenlen + totlen + 1;

  /* notify potential readers */
  MT_LIST_FOR_EACH_ENTRY_LOCKED(appctx, &ring->waiters, wait_entry, back)
    appctx_wakeup(appctx);

 done_buf:
  HA_RWLOCK_WRUNLOCK(RING_LOCK, &ring->lock);
  return sent;
}

/* Tries to attach appctx <appctx> as a new reader on ring <ring>. This is
 * meant to be used by low level appctx code such as CLI or ring forwarding.
 * For higher level functions, please see the relevant parts in appctx or CLI.
 * It returns non-zero on success or zero on failure if too many users are
 * already attached. On success, the caller MUST call dns_ring_detach_appctx()
 * to detach itself, even if it was never woken up.
 */
int dns_ring_attach(struct dns_ring *ring)
{
  int users = ring->readers_count;

  do {
    if (users >= 255)
      return 0;
  } while (!_HA_ATOMIC_CAS(&ring->readers_count, &users, users + 1));
  return 1;
}

/* detach an appctx from a ring. The appctx is expected to be waiting at offset
 * <ofs> relative to the beginning of the storage, or ~0 if not waiting yet.
 * Nothing is done if <ring> is NULL.
 */
void dns_ring_detach_appctx(struct dns_ring *ring, struct appctx *appctx, size_t ofs)
{
  if (!ring)
    return;

  HA_RWLOCK_WRLOCK(RING_LOCK, &ring->lock);
  if (ofs != ~0) {
    /* reader was still attached */
    if (ofs < b_head_ofs(&ring->buf))
      ofs += b_size(&ring->buf) - b_head_ofs(&ring->buf);
    else
      ofs -= b_head_ofs(&ring->buf);

    BUG_ON(ofs >= b_size(&ring->buf));
    MT_LIST_DELETE(&appctx->wait_entry);
    HA_ATOMIC_DEC(b_peek(&ring->buf, ofs));
  }
  HA_ATOMIC_DEC(&ring->readers_count);
  HA_RWLOCK_WRUNLOCK(RING_LOCK, &ring->lock);
}

/*
 * Local variables:
 *  c-indent-level: 8
 *  c-basic-offset: 8
 * End:
 */

Coverage Report

Created: 2025-11-24 06:16

Line	Count	Source
1		/*
2		* Ring buffer management
3		* This is a fork of ring.c for DNS usage.
4		*
5		* Copyright (C) 2000-2019 Willy Tarreau - w@1wt.eu
6		*
7		* This library is free software; you can redistribute it and/or
8		* modify it under the terms of the GNU Lesser General Public
9		* License as published by the Free Software Foundation, version 2.1
10		* exclusively.
11		*
12		* This library is distributed in the hope that it will be useful,
13		* but WITHOUT ANY WARRANTY; without even the implied warranty of
14		* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15		* Lesser General Public License for more details.
16		*
17		* You should have received a copy of the GNU Lesser General Public
18		* License along with this library; if not, write to the Free Software
19		* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20		*/
21
22		#include <stdlib.h>
23		#include <haproxy/api.h>
24		#include <haproxy/applet.h>
25		#include <haproxy/buf.h>
26		#include <haproxy/cli.h>
27		#include <haproxy/dns_ring.h>
28		#include <haproxy/sc_strm.h>
29		#include <haproxy/stconn.h>
30		#include <haproxy/thread.h>
31
32		/* Initialize a pre-allocated ring with the buffer area
33		* of size */
34		void dns_ring_init(struct dns_ring ring, void area, size_t size)
35	0	{
36	0	HA_RWLOCK_INIT(&ring->lock);
37	0	MT_LIST_INIT(&ring->waiters);
38	0	ring->readers_count = 0;
39	0	ring->buf = b_make(area, size, 0, 0);
40		/* write the initial RC byte */
41	0	b_putchr(&ring->buf, 0);
42	0	}
43
44		/* Creates and returns a ring buffer of size <size> bytes. Returns NULL on
45		* allocation failure.
46		*/
47		struct dns_ring *dns_ring_new(size_t size)
48	0	{
49	0	struct dns_ring *ring = NULL;
50	0	void *area = NULL;
51
52	0	if (size < 2)
53	0	goto fail;
54
55	0	ring = malloc(sizeof(*ring));
56	0	if (!ring)
57	0	goto fail;
58
59	0	area = malloc(size);
60	0	if (!area)
61	0	goto fail;
62
63	0	dns_ring_init(ring, area, size);
64	0	return ring;
65	0	fail:
66	0	free(area);
67	0	free(ring);
68	0	return NULL;
69	0	}
70
71		/* destroys and frees ring <ring> */
72		void dns_ring_free(struct dns_ring *ring)
73	0	{
74	0	if (!ring)
75	0	return;
76
77	0	free(ring->buf.area);
78	0	free(ring);
79	0	}
80
81		/* Tries to send <npfx> parts from <prefix> followed by <nmsg> parts from <msg>
82		* to ring <ring>. The message is sent atomically. It may be truncated to
83		* <maxlen> bytes if <maxlen> is non-null. There is no distinction between the
84		* two lists, it's just a convenience to help the caller prepend some prefixes
85		* when necessary. It takes the ring's write lock to make sure no other thread
86		* will touch the buffer during the update. Returns the number of bytes sent,
87		* or <=0 on failure.
88		*/
89		ssize_t dns_ring_write(struct dns_ring *ring, size_t maxlen, const struct ist pfx[], size_t npfx, const struct ist msg[], size_t nmsg)
90	0	{
91	0	struct buffer *buf = &ring->buf;
92	0	struct appctx *appctx;
93	0	size_t totlen = 0;
94	0	size_t lenlen;
95	0	uint64_t dellen;
96	0	int dellenlen;
97	0	struct mt_list back;
98	0	ssize_t sent = 0;
99	0	int i;
100
101		/* we have to find some room to add our message (the buffer is
102		* never empty and at least contains the previous counter) and
103		* to update both the buffer contents and heads at the same
104		* time (it's doable using atomic ops but not worth the
105		* trouble, let's just lock). For this we first need to know
106		* the total message's length. We cannot measure it while
107		* copying due to the varint encoding of the length.
108		*/
109	0	for (i = 0; i < npfx; i++)
110	0	totlen += pfx[i].len;
111	0	for (i = 0; i < nmsg; i++)
112	0	totlen += msg[i].len;
113
114	0	if (totlen > maxlen)
115	0	totlen = maxlen;
116
117	0	lenlen = varint_bytes(totlen);
118
119	0	HA_RWLOCK_WRLOCK(RING_LOCK, &ring->lock);
120	0	if (lenlen + totlen + 1 + 1 > b_size(buf))
121	0	goto done_buf;
122
123	0	while (b_room(buf) < lenlen + totlen + 1) {
124		/* we need to delete the oldest message (from the end),
125		* and we have to stop if there's a reader stuck there.
126		* Unless there's corruption in the buffer it's guaranteed
127		* that we have enough data to find 1 counter byte, a
128		* varint-encoded length (1 byte min) and the message
129		* payload (0 bytes min).
130		*/
131	0	if (*b_head(buf))
132	0	goto done_buf;
133	0	dellenlen = b_peek_varint(buf, 1, &dellen);
134	0	if (!dellenlen)
135	0	goto done_buf;
136	0	BUG_ON(b_data(buf) < 1 + dellenlen + dellen);
137
138	0	b_del(buf, 1 + dellenlen + dellen);
139	0	}
140
141		/* OK now we do have room */
142	0	__b_put_varint(buf, totlen);
143
144	0	totlen = 0;
145	0	for (i = 0; i < npfx; i++) {
146	0	size_t len = pfx[i].len;
147
148	0	if (len + totlen > maxlen)
149	0	len = maxlen - totlen;
150	0	if (len)
151	0	__b_putblk(buf, pfx[i].ptr, len);
152	0	totlen += len;
153	0	}
154
155	0	for (i = 0; i < nmsg; i++) {
156	0	size_t len = msg[i].len;
157
158	0	if (len + totlen > maxlen)
159	0	len = maxlen - totlen;
160	0	if (len)
161	0	__b_putblk(buf, msg[i].ptr, len);
162	0	totlen += len;
163	0	}
164
165	0	*b_tail(buf) = 0; buf->data++; // new read counter
166	0	sent = lenlen + totlen + 1;
167
168		/* notify potential readers */
169	0	MT_LIST_FOR_EACH_ENTRY_LOCKED(appctx, &ring->waiters, wait_entry, back)
170	0	appctx_wakeup(appctx);
171
172	0	done_buf:
173	0	HA_RWLOCK_WRUNLOCK(RING_LOCK, &ring->lock);
174	0	return sent;
175	0	}
176
177		/* Tries to attach appctx <appctx> as a new reader on ring <ring>. This is
178		* meant to be used by low level appctx code such as CLI or ring forwarding.
179		* For higher level functions, please see the relevant parts in appctx or CLI.
180		* It returns non-zero on success or zero on failure if too many users are
181		* already attached. On success, the caller MUST call dns_ring_detach_appctx()
182		* to detach itself, even if it was never woken up.
183		*/
184		int dns_ring_attach(struct dns_ring *ring)
185	0	{
186	0	int users = ring->readers_count;
187
188	0	do {
189	0	if (users >= 255)
190	0	return 0;
191	0	} while (!_HA_ATOMIC_CAS(&ring->readers_count, &users, users + 1));
192	0	return 1;
193	0	}
194
195		/* detach an appctx from a ring. The appctx is expected to be waiting at offset
196		* <ofs> relative to the beginning of the storage, or ~0 if not waiting yet.
197		* Nothing is done if <ring> is NULL.
198		*/
199		void dns_ring_detach_appctx(struct dns_ring ring, struct appctx appctx, size_t ofs)
200	0	{
201	0	if (!ring)
202	0	return;
203
204	0	HA_RWLOCK_WRLOCK(RING_LOCK, &ring->lock);
205	0	if (ofs != ~0) {
206		/* reader was still attached */
207	0	if (ofs < b_head_ofs(&ring->buf))
208	0	ofs += b_size(&ring->buf) - b_head_ofs(&ring->buf);
209	0	else
210	0	ofs -= b_head_ofs(&ring->buf);
211
212	0	BUG_ON(ofs >= b_size(&ring->buf));
213	0	MT_LIST_DELETE(&appctx->wait_entry);
214	0	HA_ATOMIC_DEC(b_peek(&ring->buf, ofs));
215	0	}
216	0	HA_ATOMIC_DEC(&ring->readers_count);
217	0	HA_RWLOCK_WRUNLOCK(RING_LOCK, &ring->lock);
218	0	}
219
220		/*
221		* Local variables:
222		* c-indent-level: 8
223		* c-basic-offset: 8
224		* End:
225		*/