public inbox for passt-dev@passt.top
 help / color / mirror / code / Atom feed
5bc9509a1b980bbece49ba1e6a7b30dc313b49cc blob 6198 bytes (raw)

  1
  2
  3
  4
  5
  6
  7
  8
  9
 10
 11
 12
 13
 14
 15
 16
 17
 18
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
 
// SPDX-License-Identifier: GPL-2.0-or-later
/* udp_vu.c - UDP L2 vhost-user management functions
 *
 * Copyright Red Hat
 * Author: Laurent Vivier <lvivier@redhat.com>
 */

#include <unistd.h>
#include <assert.h>
#include <net/ethernet.h>
#include <net/if.h>
#include <netinet/in.h>
#include <netinet/ip.h>
#include <netinet/udp.h>
#include <stdint.h>
#include <stddef.h>
#include <sys/uio.h>
#include <linux/virtio_net.h>

#include "checksum.h"
#include "util.h"
#include "ip.h"
#include "siphash.h"
#include "inany.h"
#include "passt.h"
#include "pcap.h"
#include "log.h"
#include "vhost_user.h"
#include "udp_internal.h"
#include "flow.h"
#include "flow_table.h"
#include "udp_flow.h"
#include "udp_vu.h"
#include "vu_common.h"

/**
 * udp_vu_hdrlen() - Combined length of all headers preceding the UDP payload
 * @v6:		True for an IPv6 frame, false for an IPv4 one
 *
 * Return: VNET_HLEN plus the sizes of the Ethernet header, the IPv4 or IPv6
 *	   header (depending on @v6), and the UDP header
 */
static size_t udp_vu_hdrlen(bool v6)
{
	const size_t l3len = v6 ? sizeof(struct ipv6hdr) : sizeof(struct iphdr);

	return VNET_HLEN + sizeof(struct ethhdr) + sizeof(struct udphdr) + l3len;
}

/**
 * udp_vu_sock_recv() - Receive datagrams from socket into vhost-user buffers
 * @iov:	IO vector for the frame (in/out)
 * @cnt:	Number of IO vector entries (in/out)
 * @s:		Socket to receive from
 * @v6:		Set for IPv6 connections
 *
 * Return: size of received data, -1 on error
 */
static ssize_t udp_vu_sock_recv(struct iovec *iov, size_t *cnt, int s, bool v6)
{
	struct iovec msg_iov[*cnt];
	struct msghdr msg  = { 0 };
	struct iov_tail payload;
	size_t hdrlen, iov_used;
	ssize_t dlen;

	/* compute L2 header length */
	hdrlen = udp_vu_hdrlen(v6);

	payload = IOV_TAIL(iov, *cnt, hdrlen);

	msg.msg_iov = msg_iov;
	msg.msg_iovlen = iov_tail_clone(msg.msg_iov, payload.cnt, &payload);

	/* read data from the socket */
	dlen = recvmsg(s, &msg, 0);
	if (dlen < 0)
		return -1;

	iov_used = iov_skip_bytes(iov, *cnt,
				  MAX(dlen + hdrlen, VNET_HLEN + ETH_ZLEN),
				  NULL);
	if (iov_used < *cnt)
		iov_used++;
	*cnt = iov_used; /* one iovec per element */

	return dlen;
}

/**
 * udp_vu_prepare() - Prepare the packet header
 * @c:		Execution context
 * @data:	IO vector tail for the frame,
 * 		on return, points to the L3 frame
 * @toside:	Address information for one side of the flow
 * @dlen:	Packet data length
 *
 * Return: Layer-4 length
 */
static size_t udp_vu_prepare(const struct ctx *c, struct iov_tail *data,
			     const struct flowside *toside, size_t dlen)
{
	bool ipv4 = inany_v4(&toside->eaddr) && inany_v4(&toside->oaddr);
	struct ethhdr eh;
	size_t l4len;

	/* ethernet header */
	memcpy(eh.h_dest, c->guest_mac, sizeof(eh.h_dest));
	memcpy(eh.h_source, c->our_tap_mac, sizeof(eh.h_source));

	if (ipv4)
		eh.h_proto = htons(ETH_P_IP);
	else
		eh.h_proto = htons(ETH_P_IPV6);
	IOV_PUSH_HEADER(data, eh);

	/* initialize header */
	if (ipv4) {
		struct iov_tail udp_frame;
		struct iphdr iph;

		iph = (struct iphdr)L2_BUF_IP4_INIT(IPPROTO_UDP);

		udp_frame = *data;
		IOV_DROP_HEADER(&udp_frame, struct iphdr);
		l4len = udp_update_hdr4(&iph, &udp_frame, toside, dlen, true);

		IOV_PUSH_HEADER(data, iph);
	} else {
		struct iov_tail udp_frame;
		struct ipv6hdr ip6h;

		ip6h = (struct ipv6hdr)L2_BUF_IP6_INIT(IPPROTO_UDP);

		udp_frame = *data;
		IOV_DROP_HEADER(&udp_frame, struct ipv6hdr);
		l4len = udp_update_hdr6(&ip6h, &udp_frame, toside, dlen, true);

		IOV_PUSH_HEADER(data, ip6h);
	}

	return l4len;
}

/**
 * udp_vu_csum() - Compute the checksum of a UDP packet
 * @toside:	Address information for one side of the flow: its @oaddr is
 *		passed as source and its @eaddr as destination address
 * @data:	IO vector tail positioned at the UDP header; the header is
 *		removed from it before the rest is handed to the checksum
 *		helpers
 * @l4len:	L4 length
 */
static void udp_vu_csum(const struct flowside *toside, struct iov_tail *data,
			size_t l4len)
{
	const struct in_addr *saddr4 = inany_v4(&toside->oaddr);
	const struct in_addr *daddr4 = inany_v4(&toside->eaddr);
	struct udphdr uh_buf, *uh;

	/* NOTE(review): the result is used unchecked - confirm that
	 * IOV_REMOVE_HEADER() cannot return NULL here, and that a header
	 * returned via @uh_buf (if that can happen) doesn't need to be
	 * written back
	 */
	uh = IOV_REMOVE_HEADER(data, uh_buf);

	/* Anything that isn't IPv4 on both ends is handled as IPv6 */
	if (!saddr4 || !daddr4) {
		csum_udp6(uh, &toside->oaddr.a6, &toside->eaddr.a6, data, l4len);
		return;
	}

	csum_udp4(uh, *saddr4, *daddr4, data, l4len);
}

/**
 * udp_vu_sock_to_tap() - Forward datagrams from a socket to the vhost-user tap
 * @c:		Execution context
 * @s:		Socket to read data from
 * @n:		Maximum number of datagrams to forward
 * @tosidx:	Flow & side to forward data from @s to
 *
 * If the RX virtqueue is not enabled and started, up to @n datagrams are read
 * from @s and dropped instead. Otherwise, forwarding stops early if no buffers
 * can be collected from the queue or if receiving from the socket fails.
 */
void udp_vu_sock_to_tap(const struct ctx *c, int s, int n, flow_sidx_t tosidx)
{
	static struct vu_virtq_element elems[VIRTQUEUE_MAX_SIZE];
	static struct iovec iovs[VIRTQUEUE_MAX_SIZE];
	const struct flowside *toside = flowside_at_sidx(tosidx);
	bool v6 = !inany_v4(&toside->eaddr) || !inany_v4(&toside->oaddr);
	struct vu_dev *vdev = c->vdev;
	struct vu_virtq *rxq = &vdev->vq[VHOST_USER_RX_QUEUE];
	size_t hdrlen = udp_vu_hdrlen(v6);
	int i;

	assert(!c->no_udp);

	if (!(vu_queue_enabled(rxq) && vu_queue_started(rxq))) {
		/* No buffers given: reads with an empty message header, which
		 * is expected to drop one pending datagram per call
		 */
		struct msghdr discard = { 0 };

		debug("Got UDP packet, but RX virtqueue not usable yet");

		for (i = 0; i < n; i++) {
			if (recvmsg(s, &discard, MSG_DONTWAIT) < 0)
				debug_perror("Failed to discard datagram");
		}

		return;
	}

	for (i = 0; i < n; i++) {
		unsigned elem_cnt, used = 0, covered = 0;
		size_t iov_cnt, frame_len, l4len;
		struct iov_tail data;
		ssize_t dlen;

		/* Ask for buffers up to the largest frame we might receive */
		elem_cnt = vu_collect(vdev, rxq, elems, ARRAY_SIZE(elems),
				      iovs, ARRAY_SIZE(iovs), &iov_cnt,
				      IP_MAX_MTU + ETH_HLEN + VNET_HLEN, NULL);
		if (!elem_cnt)
			break;

		dlen = udp_vu_sock_recv(iovs, &iov_cnt, s, v6);
		if (dlen < 0) {
			/* Nothing received: give back everything collected */
			vu_queue_rewind(rxq, elem_cnt);
			break;
		}

		/* Walk the elements until they cover the @iov_cnt entries that
		 * are actually used, trimming the last one if it extends past
		 * them
		 */
		while (covered < iov_cnt && used < elem_cnt) {
			struct vu_virtq_element *e = &elems[used];

			if (covered + e->in_num > iov_cnt)
				e->in_num = iov_cnt - covered;
			covered += e->in_num;
			used++;
		}

		/* Return the elements this frame doesn't need */
		vu_queue_rewind(rxq, elem_cnt - used);

		if (!iov_cnt)
			continue;

		data = IOV_TAIL(iovs, iov_cnt, VNET_HLEN);
		l4len = udp_vu_prepare(c, &data, toside, dlen);
		frame_len = hdrlen + dlen;

		/* The UDP checksum is only computed if the frame is captured */
		if (*c->pcap) {
			udp_vu_csum(toside, &data, l4len);
			pcap_iov(iovs, iov_cnt, VNET_HLEN,
				 frame_len - VNET_HLEN);
		}

		vu_pad(iovs, iov_cnt, frame_len);
		vu_flush(vdev, rxq, elems, used, frame_len);
		vu_queue_notify(vdev, rxq);
	}
}
debug log:

solving 5bc9509a1b98 ...
found 5bc9509a1b98 in https://archives.passt.top/passt-dev/20260401192326.1783350-4-lvivier@redhat.com/
found 5608a3a96ff5 in https://archives.passt.top/passt-dev/20260401192326.1783350-2-lvivier@redhat.com/
found 30af64034516 in https://archives.passt.top/passt-dev/20260401191826.1782394-11-lvivier@redhat.com/
found 4641f42eb5c4 in https://archives.passt.top/passt-dev/20260401191826.1782394-9-lvivier@redhat.com/
found 81491afa7e6a in https://archives.passt.top/passt-dev/20260401191826.1782394-8-lvivier@redhat.com/
found 5421a7d71a19 in https://archives.passt.top/passt-dev/20260401191826.1782394-7-lvivier@redhat.com/
found 9688fe1fdc5c in https://archives.passt.top/passt-dev/20260401191826.1782394-6-lvivier@redhat.com/
found 34f39e1256f8 in https://archives.passt.top/passt-dev/20260401191826.1782394-5-lvivier@redhat.com/
found f8629af58ab5 in https://archives.passt.top/passt-dev/20260401191826.1782394-4-lvivier@redhat.com/ ||
	https://archives.passt.top/passt-dev/20260327175834.831995-3-lvivier@redhat.com/
found cc69654398f0 in https://passt.top/passt
preparing index
index prepared:
100644 cc69654398f02b2b21b3d7f41eb12060e177a709	udp_vu.c

applying [1/10] https://archives.passt.top/passt-dev/20260401191826.1782394-4-lvivier@redhat.com/
diff --git a/udp_vu.c b/udp_vu.c
index cc69654398f0..f8629af58ab5 100644

Checking patch udp_vu.c...
Applied patch udp_vu.c cleanly.

skipping https://archives.passt.top/passt-dev/20260327175834.831995-3-lvivier@redhat.com/ for f8629af58ab5
index at:
100644 f8629af58ab54f9f9728b2364c5b31bb03bb681a	udp_vu.c

applying [2/10] https://archives.passt.top/passt-dev/20260401191826.1782394-5-lvivier@redhat.com/
diff --git a/udp_vu.c b/udp_vu.c
index f8629af58ab5..34f39e1256f8 100644


applying [3/10] https://archives.passt.top/passt-dev/20260401191826.1782394-6-lvivier@redhat.com/
diff --git a/udp_vu.c b/udp_vu.c
index 34f39e1256f8..9688fe1fdc5c 100644


applying [4/10] https://archives.passt.top/passt-dev/20260401191826.1782394-7-lvivier@redhat.com/
diff --git a/udp_vu.c b/udp_vu.c
index 9688fe1fdc5c..5421a7d71a19 100644


applying [5/10] https://archives.passt.top/passt-dev/20260401191826.1782394-8-lvivier@redhat.com/
diff --git a/udp_vu.c b/udp_vu.c
index 5421a7d71a19..81491afa7e6a 100644


applying [6/10] https://archives.passt.top/passt-dev/20260401191826.1782394-9-lvivier@redhat.com/
diff --git a/udp_vu.c b/udp_vu.c
index 81491afa7e6a..4641f42eb5c4 100644


applying [7/10] https://archives.passt.top/passt-dev/20260401191826.1782394-11-lvivier@redhat.com/
diff --git a/udp_vu.c b/udp_vu.c
index 4641f42eb5c4..30af64034516 100644


applying [8/10] https://archives.passt.top/passt-dev/20260401192326.1783350-2-lvivier@redhat.com/
diff --git a/udp_vu.c b/udp_vu.c
index 30af64034516..5608a3a96ff5 100644


applying [9/10] https://archives.passt.top/passt-dev/20260401192326.1783350-4-lvivier@redhat.com/
diff --git a/udp_vu.c b/udp_vu.c
index 5608a3a96ff5..5bc9509a1b98 100644

Checking patch udp_vu.c...
Applied patch udp_vu.c cleanly.
Checking patch udp_vu.c...
Applied patch udp_vu.c cleanly.
Checking patch udp_vu.c...
Applied patch udp_vu.c cleanly.
Checking patch udp_vu.c...
Applied patch udp_vu.c cleanly.
Checking patch udp_vu.c...
Applied patch udp_vu.c cleanly.
Checking patch udp_vu.c...
Applied patch udp_vu.c cleanly.
Checking patch udp_vu.c...
Applied patch udp_vu.c cleanly.
Checking patch udp_vu.c...
Applied patch udp_vu.c cleanly.

index at:
100644 5bc9509a1b980bbece49ba1e6a7b30dc313b49cc	udp_vu.c

Code repositories for project(s) associated with this public inbox

	https://passt.top/passt

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for IMAP folder(s).