Loading...
1/*
2 * Copyright (C) 2001 - 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com)
3 * Licensed under the GPL
4 */
5
6#include <stdio.h>
7#include <unistd.h>
8#include <stdarg.h>
9#include <errno.h>
10#include <stddef.h>
11#include <string.h>
12#include <sys/ioctl.h>
13#include <net/if.h>
14#include <linux/if_tun.h>
15#include <arpa/inet.h>
16#include <sys/types.h>
17#include <sys/stat.h>
18#include <fcntl.h>
19#include <sys/types.h>
20#include <sys/socket.h>
21#include <net/ethernet.h>
22#include <netinet/ip.h>
23#include <netinet/ether.h>
24#include <linux/if_ether.h>
25#include <linux/if_packet.h>
26#include <sys/socket.h>
27#include <sys/wait.h>
28#include <linux/virtio_net.h>
29#include <netdb.h>
30#include <stdlib.h>
31#include <os.h>
32#include <um_malloc.h>
33#include "vector_user.h"
34
35#define ID_GRE 0
36#define ID_L2TPV3 1
37#define ID_MAX 1
38
39#define TOKEN_IFNAME "ifname"
40
41#define TRANS_RAW "raw"
42#define TRANS_RAW_LEN strlen(TRANS_RAW)
43
44#define VNET_HDR_FAIL "could not enable vnet headers on fd %d"
45#define TUN_GET_F_FAIL "tapraw: TUNGETFEATURES failed: %s"
46#define L2TPV3_BIND_FAIL "l2tpv3_open : could not bind socket err=%i"
47#define BPF_ATTACH_FAIL "Failed to attach filter size %d to %d, err %d\n"
48
49/* This is very ugly and brute force lookup, but it is done
50 * only once at initialization so not worth doing hashes or
51 * anything more intelligent
52 */
53
54char *uml_vector_fetch_arg(struct arglist *ifspec, char *token)
55{
56 int i;
57
58 for (i = 0; i < ifspec->numargs; i++) {
59 if (strcmp(ifspec->tokens[i], token) == 0)
60 return ifspec->values[i];
61 }
62 return NULL;
63
64}
65
66struct arglist *uml_parse_vector_ifspec(char *arg)
67{
68 struct arglist *result;
69 int pos, len;
70 bool parsing_token = true, next_starts = true;
71
72 if (arg == NULL)
73 return NULL;
74 result = uml_kmalloc(sizeof(struct arglist), UM_GFP_KERNEL);
75 if (result == NULL)
76 return NULL;
77 result->numargs = 0;
78 len = strlen(arg);
79 for (pos = 0; pos < len; pos++) {
80 if (next_starts) {
81 if (parsing_token) {
82 result->tokens[result->numargs] = arg + pos;
83 } else {
84 result->values[result->numargs] = arg + pos;
85 result->numargs++;
86 }
87 next_starts = false;
88 }
89 if (*(arg + pos) == '=') {
90 if (parsing_token)
91 parsing_token = false;
92 else
93 goto cleanup;
94 next_starts = true;
95 (*(arg + pos)) = '\0';
96 }
97 if (*(arg + pos) == ',') {
98 parsing_token = true;
99 next_starts = true;
100 (*(arg + pos)) = '\0';
101 }
102 }
103 return result;
104cleanup:
105 printk(UM_KERN_ERR "vector_setup - Couldn't parse '%s'\n", arg);
106 kfree(result);
107 return NULL;
108}
109
/*
 * Socket/FD configuration functions. These return a structure
 * of rx and tx descriptors to cover cases where these are not
 * the same (e.g. read via raw socket and write via tap).
 */
115
116#define PATH_NET_TUN "/dev/net/tun"
117
118static struct vector_fds *user_init_tap_fds(struct arglist *ifspec)
119{
120 struct ifreq ifr;
121 int fd = -1;
122 struct sockaddr_ll sock;
123 int err = -ENOMEM, offload;
124 char *iface;
125 struct vector_fds *result = NULL;
126
127 iface = uml_vector_fetch_arg(ifspec, TOKEN_IFNAME);
128 if (iface == NULL) {
129 printk(UM_KERN_ERR "uml_tap: failed to parse interface spec\n");
130 goto tap_cleanup;
131 }
132
133 result = uml_kmalloc(sizeof(struct vector_fds), UM_GFP_KERNEL);
134 if (result == NULL) {
135 printk(UM_KERN_ERR "uml_tap: failed to allocate file descriptors\n");
136 goto tap_cleanup;
137 }
138 result->rx_fd = -1;
139 result->tx_fd = -1;
140 result->remote_addr = NULL;
141 result->remote_addr_size = 0;
142
143 /* TAP */
144
145 fd = open(PATH_NET_TUN, O_RDWR);
146 if (fd < 0) {
147 printk(UM_KERN_ERR "uml_tap: failed to open tun device\n");
148 goto tap_cleanup;
149 }
150 result->tx_fd = fd;
151 memset(&ifr, 0, sizeof(ifr));
152 ifr.ifr_flags = IFF_TAP | IFF_NO_PI | IFF_VNET_HDR;
153 strncpy((char *)&ifr.ifr_name, iface, sizeof(ifr.ifr_name) - 1);
154
155 err = ioctl(fd, TUNSETIFF, (void *) &ifr);
156 if (err != 0) {
157 printk(UM_KERN_ERR "uml_tap: failed to select tap interface\n");
158 goto tap_cleanup;
159 }
160
161 offload = TUN_F_CSUM | TUN_F_TSO4 | TUN_F_TSO6;
162 ioctl(fd, TUNSETOFFLOAD, offload);
163
164 /* RAW */
165
166 fd = socket(AF_PACKET, SOCK_RAW, htons(ETH_P_ALL));
167 if (fd == -1) {
168 printk(UM_KERN_ERR
169 "uml_tap: failed to create socket: %i\n", -errno);
170 goto tap_cleanup;
171 }
172 result->rx_fd = fd;
173 memset(&ifr, 0, sizeof(ifr));
174 strncpy((char *)&ifr.ifr_name, iface, sizeof(ifr.ifr_name) - 1);
175 if (ioctl(fd, SIOCGIFINDEX, (void *) &ifr) < 0) {
176 printk(UM_KERN_ERR
177 "uml_tap: failed to set interface: %i\n", -errno);
178 goto tap_cleanup;
179 }
180
181 sock.sll_family = AF_PACKET;
182 sock.sll_protocol = htons(ETH_P_ALL);
183 sock.sll_ifindex = ifr.ifr_ifindex;
184
185 if (bind(fd,
186 (struct sockaddr *) &sock, sizeof(struct sockaddr_ll)) < 0) {
187 printk(UM_KERN_ERR
188 "user_init_tap: failed to bind raw pair, err %d\n",
189 -errno);
190 goto tap_cleanup;
191 }
192 return result;
193tap_cleanup:
194 printk(UM_KERN_ERR "user_init_tap: init failed, error %d", err);
195 if (result != NULL) {
196 if (result->rx_fd >= 0)
197 os_close_file(result->rx_fd);
198 if (result->tx_fd >= 0)
199 os_close_file(result->tx_fd);
200 kfree(result);
201 }
202 return NULL;
203}
204
205
206static struct vector_fds *user_init_raw_fds(struct arglist *ifspec)
207{
208 struct ifreq ifr;
209 int rxfd = -1, txfd = -1;
210 struct sockaddr_ll sock;
211 int err = -ENOMEM;
212 char *iface;
213 struct vector_fds *result = NULL;
214
215 iface = uml_vector_fetch_arg(ifspec, TOKEN_IFNAME);
216 if (iface == NULL)
217 goto cleanup;
218
219 rxfd = socket(AF_PACKET, SOCK_RAW, ETH_P_ALL);
220 if (rxfd == -1) {
221 err = -errno;
222 goto cleanup;
223 }
224 txfd = socket(AF_PACKET, SOCK_RAW, 0); /* Turn off RX on this fd */
225 if (txfd == -1) {
226 err = -errno;
227 goto cleanup;
228 }
229 memset(&ifr, 0, sizeof(ifr));
230 strncpy((char *)&ifr.ifr_name, iface, sizeof(ifr.ifr_name) - 1);
231 if (ioctl(rxfd, SIOCGIFINDEX, (void *) &ifr) < 0) {
232 err = -errno;
233 goto cleanup;
234 }
235
236 sock.sll_family = AF_PACKET;
237 sock.sll_protocol = htons(ETH_P_ALL);
238 sock.sll_ifindex = ifr.ifr_ifindex;
239
240 if (bind(rxfd,
241 (struct sockaddr *) &sock, sizeof(struct sockaddr_ll)) < 0) {
242 err = -errno;
243 goto cleanup;
244 }
245
246 sock.sll_family = AF_PACKET;
247 sock.sll_protocol = htons(ETH_P_IP);
248 sock.sll_ifindex = ifr.ifr_ifindex;
249
250 if (bind(txfd,
251 (struct sockaddr *) &sock, sizeof(struct sockaddr_ll)) < 0) {
252 err = -errno;
253 goto cleanup;
254 }
255
256 result = uml_kmalloc(sizeof(struct vector_fds), UM_GFP_KERNEL);
257 if (result != NULL) {
258 result->rx_fd = rxfd;
259 result->tx_fd = txfd;
260 result->remote_addr = NULL;
261 result->remote_addr_size = 0;
262 }
263 return result;
264cleanup:
265 printk(UM_KERN_ERR "user_init_raw: init failed, error %d", err);
266 if (rxfd >= 0)
267 os_close_file(rxfd);
268 if (txfd >= 0)
269 os_close_file(txfd);
270 if (result != NULL)
271 kfree(result);
272 return NULL;
273}
274
275
/*
 * Set the PACKET_QDISC_BYPASS option on packet socket @fd.
 *
 * Returns true when setsockopt() succeeds, false otherwise.
 */
bool uml_raw_enable_qdisc_bypass(int fd)
{
	int enable = 1;
	int rc;

	rc = setsockopt(fd, SOL_PACKET, PACKET_QDISC_BYPASS,
			&enable, sizeof(enable));
	return rc == 0;
}
287
288bool uml_raw_enable_vnet_headers(int fd)
289{
290 int optval = 1;
291
292 if (setsockopt(fd,
293 SOL_PACKET, PACKET_VNET_HDR,
294 &optval, sizeof(optval)) != 0) {
295 printk(UM_KERN_INFO VNET_HDR_FAIL, fd);
296 return false;
297 }
298 return true;
299}
300bool uml_tap_enable_vnet_headers(int fd)
301{
302 unsigned int features;
303 int len = sizeof(struct virtio_net_hdr);
304
305 if (ioctl(fd, TUNGETFEATURES, &features) == -1) {
306 printk(UM_KERN_INFO TUN_GET_F_FAIL, strerror(errno));
307 return false;
308 }
309 if ((features & IFF_VNET_HDR) == 0) {
310 printk(UM_KERN_INFO "tapraw: No VNET HEADER support");
311 return false;
312 }
313 ioctl(fd, TUNSETVNETHDRSZ, &len);
314 return true;
315}
316
/*
 * Open the socket used by the GRE and L2TPv3 transports.
 *
 * @ifspec supplies "src"/"srcport" (local address to bind), "dst"/
 * "dstport" (remote address stored in the result) and the optional
 * "v6" and "udp" switches, which are enabled by a value > 0.
 * @id selects the protocol: ID_GRE uses a raw IPPROTO_GRE socket,
 * ID_L2TPV3 uses a raw IPPROTO_L2TP socket or, with udp set, a
 * datagram socket.
 *
 * Returns a newly allocated vector_fds whose rx_fd and tx_fd are the
 * same socket and whose remote_addr is a copy of the resolved
 * destination, or NULL on failure. On every failure path after the
 * socket has been opened, the socket is closed.
 */
static struct vector_fds *user_init_socket_fds(struct arglist *ifspec, int id)
{
	int err = -ENOMEM;
	int fd = -1, gairet;
	struct addrinfo hints;
	bool v6 = false, udp = false;
	char *value;
	char *src, *dst, *srcport, *dstport;
	struct addrinfo *gairesult = NULL;
	struct vector_fds *result = NULL;

	value = uml_vector_fetch_arg(ifspec, "v6");
	if (value != NULL) {
		if (strtol((const char *) value, NULL, 10) > 0)
			v6 = true;
	}

	value = uml_vector_fetch_arg(ifspec, "udp");
	if (value != NULL) {
		if (strtol((const char *) value, NULL, 10) > 0)
			udp = true;
	}
	src = uml_vector_fetch_arg(ifspec, "src");
	dst = uml_vector_fetch_arg(ifspec, "dst");
	srcport = uml_vector_fetch_arg(ifspec, "srcport");
	dstport = uml_vector_fetch_arg(ifspec, "dstport");

	/* The same hints are used for the source and destination lookups. */
	memset(&hints, 0, sizeof(hints));

	if (v6)
		hints.ai_family = AF_INET6;
	else
		hints.ai_family = AF_INET;

	switch (id) {
	case ID_GRE:
		hints.ai_socktype = SOCK_RAW;
		hints.ai_protocol = IPPROTO_GRE;
		break;
	case ID_L2TPV3:
		if (udp) {
			hints.ai_socktype = SOCK_DGRAM;
			hints.ai_protocol = 0;
		} else {
			hints.ai_socktype = SOCK_RAW;
			hints.ai_protocol = IPPROTO_L2TP;
		}
		break;
	default:
		printk(UM_KERN_ERR "Unsupported socket type\n");
		return NULL;
	}

	gairet = getaddrinfo(src, srcport, &hints, &gairesult);
	if ((gairet != 0) || (gairesult == NULL)) {
		printk(UM_KERN_ERR
			"socket_open : could not resolve src, error = %s",
			gai_strerror(gairet)
		);
		/* Nothing has been acquired yet. */
		return NULL;
	}
	fd = socket(gairesult->ai_family,
		gairesult->ai_socktype, gairesult->ai_protocol);
	if (fd == -1) {
		err = -errno;
		printk(UM_KERN_ERR
			"socket_open : could not open socket, error = %d",
			err
		);
		goto cleanup;
	}
	if (bind(fd,
		(struct sockaddr *) gairesult->ai_addr,
		gairesult->ai_addrlen)) {
		err = -errno;
		printk(UM_KERN_ERR L2TPV3_BIND_FAIL, -err);
		goto cleanup;
	}

	freeaddrinfo(gairesult);
	gairesult = NULL;

	gairet = getaddrinfo(dst, dstport, &hints, &gairesult);
	if ((gairet != 0) || (gairesult == NULL)) {
		err = -EINVAL;
		printk(UM_KERN_ERR
			"socket_open : could not resolve dst, error = %s",
			gai_strerror(gairet)
		);
		/* The bound socket must not leak. */
		goto cleanup;
	}

	result = uml_kmalloc(sizeof(struct vector_fds), UM_GFP_KERNEL);
	if (result == NULL)
		goto cleanup;	/* err is still -ENOMEM here */

	result->rx_fd = fd;
	result->tx_fd = fd;
	result->remote_addr = uml_kmalloc(
		gairesult->ai_addrlen, UM_GFP_KERNEL);
	if (result->remote_addr == NULL)
		goto cleanup;
	result->remote_addr_size = gairesult->ai_addrlen;
	memcpy(
		result->remote_addr,
		gairesult->ai_addr,
		gairesult->ai_addrlen
	);
	freeaddrinfo(gairesult);
	return result;
cleanup:
	if (gairesult != NULL)
		freeaddrinfo(gairesult);
	printk(UM_KERN_ERR "user_init_socket: init failed, error %d", err);
	if (fd >= 0)
		os_close_file(fd);
	if (result != NULL) {
		if (result->remote_addr != NULL)
			kfree(result->remote_addr);
		kfree(result);
	}
	return NULL;
}
443
444struct vector_fds *uml_vector_user_open(
445 int unit,
446 struct arglist *parsed
447)
448{
449 char *transport;
450
451 if (parsed == NULL) {
452 printk(UM_KERN_ERR "no parsed config for unit %d\n", unit);
453 return NULL;
454 }
455 transport = uml_vector_fetch_arg(parsed, "transport");
456 if (transport == NULL) {
457 printk(UM_KERN_ERR "missing transport for unit %d\n", unit);
458 return NULL;
459 }
460 if (strncmp(transport, TRANS_RAW, TRANS_RAW_LEN) == 0)
461 return user_init_raw_fds(parsed);
462 if (strncmp(transport, TRANS_TAP, TRANS_TAP_LEN) == 0)
463 return user_init_tap_fds(parsed);
464 if (strncmp(transport, TRANS_GRE, TRANS_GRE_LEN) == 0)
465 return user_init_socket_fds(parsed, ID_GRE);
466 if (strncmp(transport, TRANS_L2TPV3, TRANS_L2TPV3_LEN) == 0)
467 return user_init_socket_fds(parsed, ID_L2TPV3);
468 return NULL;
469}
470
471
/*
 * sendmsg() wrapper: @hdr is a struct msghdr passed as void *.
 *
 * Returns the non-negative sendmsg() result, 0 when the call failed
 * with EAGAIN, and -errno for any other failure.
 */
int uml_vector_sendmsg(int fd, void *hdr, int flags)
{
	struct msghdr *msg = hdr;
	int sent;

	CATCH_EINTR(sent = sendmsg(fd, msg, flags));
	if (sent >= 0)
		return sent;

	return (errno == EAGAIN) ? 0 : -errno;
}
484
/*
 * recvmsg() wrapper: @hdr is a struct msghdr passed as void *.
 *
 * Returns the non-negative recvmsg() result, 0 when the call failed
 * with EAGAIN, and -errno for any other failure.
 */
int uml_vector_recvmsg(int fd, void *hdr, int flags)
{
	struct msghdr *msg = hdr;
	int received;

	CATCH_EINTR(received = recvmsg(fd, msg, flags));
	if (received >= 0)
		return received;

	return (errno == EAGAIN) ? 0 : -errno;
}
497
/*
 * writev() wrapper: @hdr is an array of @iovcount struct iovec entries
 * passed as void *.
 *
 * Returns the non-negative writev() result, 0 when the call failed with
 * EAGAIN, and -errno for any other failure.
 */
int uml_vector_writev(int fd, void *hdr, int iovcount)
{
	struct iovec *iov = hdr;
	int written;

	CATCH_EINTR(written = writev(fd, iov, iovcount));
	if (written >= 0)
		return written;

	return (errno == EAGAIN) ? 0 : -errno;
}
510
/*
 * sendmmsg() wrapper: @msgvec is an array of @vlen struct mmsghdr
 * entries passed as void *.
 *
 * Returns the non-negative sendmmsg() result, 0 when the call failed
 * with EAGAIN, and -errno for any other failure.
 */
int uml_vector_sendmmsg(
	int fd,
	void *msgvec,
	unsigned int vlen,
	unsigned int flags)
{
	struct mmsghdr *msgs = msgvec;
	int sent;

	CATCH_EINTR(sent = sendmmsg(fd, msgs, vlen, flags));
	if (sent >= 0)
		return sent;

	return (errno == EAGAIN) ? 0 : -errno;
}
527
/*
 * recvmmsg() wrapper: @msgvec is an array of @vlen struct mmsghdr
 * entries passed as void *. No timeout is supplied.
 *
 * Returns the non-negative recvmmsg() result, 0 when the call failed
 * with EAGAIN, and -errno for any other failure.
 */
int uml_vector_recvmmsg(
	int fd,
	void *msgvec,
	unsigned int vlen,
	unsigned int flags)
{
	struct mmsghdr *msgs = msgvec;
	int received;

	CATCH_EINTR(received = recvmmsg(fd, msgs, vlen, flags, 0));
	if (received >= 0)
		return received;

	return (errno == EAGAIN) ? 0 : -errno;
}
545int uml_vector_attach_bpf(int fd, void *bpf, int bpf_len)
546{
547 int err = setsockopt(fd, SOL_SOCKET, SO_ATTACH_FILTER, bpf, bpf_len);
548
549 if (err < 0)
550 printk(KERN_ERR BPF_ATTACH_FAIL, bpf_len, fd, -errno);
551 return err;
552}
553
554#define DEFAULT_BPF_LEN 6
555
556void *uml_vector_default_bpf(int fd, void *mac)
557{
558 struct sock_filter *bpf;
559 uint32_t *mac1 = (uint32_t *)(mac + 2);
560 uint16_t *mac2 = (uint16_t *) mac;
561 struct sock_fprog bpf_prog = {
562 .len = 6,
563 .filter = NULL,
564 };
565
566 bpf = uml_kmalloc(
567 sizeof(struct sock_filter) * DEFAULT_BPF_LEN, UM_GFP_KERNEL);
568 if (bpf != NULL) {
569 bpf_prog.filter = bpf;
570 /* ld [8] */
571 bpf[0] = (struct sock_filter){ 0x20, 0, 0, 0x00000008 };
572 /* jeq #0xMAC[2-6] jt 2 jf 5*/
573 bpf[1] = (struct sock_filter){ 0x15, 0, 3, ntohl(*mac1)};
574 /* ldh [6] */
575 bpf[2] = (struct sock_filter){ 0x28, 0, 0, 0x00000006 };
576 /* jeq #0xMAC[0-1] jt 4 jf 5 */
577 bpf[3] = (struct sock_filter){ 0x15, 0, 1, ntohs(*mac2)};
578 /* ret #0 */
579 bpf[4] = (struct sock_filter){ 0x6, 0, 0, 0x00000000 };
580 /* ret #0x40000 */
581 bpf[5] = (struct sock_filter){ 0x6, 0, 0, 0x00040000 };
582 if (uml_vector_attach_bpf(
583 fd, &bpf_prog, sizeof(struct sock_fprog)) < 0) {
584 kfree(bpf);
585 bpf = NULL;
586 }
587 }
588 return bpf;
589}
590
1// SPDX-License-Identifier: GPL-2.0
2/*
3 * Copyright (C) 2001 - 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com)
4 */
5
6#include <stdio.h>
7#include <unistd.h>
8#include <stdarg.h>
9#include <errno.h>
10#include <stddef.h>
11#include <string.h>
12#include <sys/ioctl.h>
13#include <net/if.h>
14#include <linux/if_tun.h>
15#include <arpa/inet.h>
16#include <sys/types.h>
17#include <sys/stat.h>
18#include <fcntl.h>
19#include <sys/socket.h>
20#include <sys/un.h>
21#include <net/ethernet.h>
22#include <netinet/ip.h>
23#include <netinet/ether.h>
24#include <linux/if_ether.h>
25#include <linux/if_packet.h>
26#include <sys/wait.h>
27#include <sys/uio.h>
28#include <linux/virtio_net.h>
29#include <netdb.h>
30#include <stdlib.h>
31#include <os.h>
32#include <um_malloc.h>
33#include "vector_user.h"
34
35#define ID_GRE 0
36#define ID_L2TPV3 1
37#define ID_BESS 2
38#define ID_MAX 2
39
40#define TOKEN_IFNAME "ifname"
41
42#define TRANS_RAW "raw"
43#define TRANS_RAW_LEN strlen(TRANS_RAW)
44
45#define VNET_HDR_FAIL "could not enable vnet headers on fd %d"
46#define TUN_GET_F_FAIL "tapraw: TUNGETFEATURES failed: %s"
47#define L2TPV3_BIND_FAIL "l2tpv3_open : could not bind socket err=%i"
48#define UNIX_BIND_FAIL "unix_open : could not bind socket err=%i"
49#define BPF_ATTACH_FAIL "Failed to attach filter size %d to %d, err %d\n"
50
51#define MAX_UN_LEN 107
52
53/* This is very ugly and brute force lookup, but it is done
54 * only once at initialization so not worth doing hashes or
55 * anything more intelligent
56 */
57
58char *uml_vector_fetch_arg(struct arglist *ifspec, char *token)
59{
60 int i;
61
62 for (i = 0; i < ifspec->numargs; i++) {
63 if (strcmp(ifspec->tokens[i], token) == 0)
64 return ifspec->values[i];
65 }
66 return NULL;
67
68}
69
70struct arglist *uml_parse_vector_ifspec(char *arg)
71{
72 struct arglist *result;
73 int pos, len;
74 bool parsing_token = true, next_starts = true;
75
76 if (arg == NULL)
77 return NULL;
78 result = uml_kmalloc(sizeof(struct arglist), UM_GFP_KERNEL);
79 if (result == NULL)
80 return NULL;
81 result->numargs = 0;
82 len = strlen(arg);
83 for (pos = 0; pos < len; pos++) {
84 if (next_starts) {
85 if (parsing_token) {
86 result->tokens[result->numargs] = arg + pos;
87 } else {
88 result->values[result->numargs] = arg + pos;
89 result->numargs++;
90 }
91 next_starts = false;
92 }
93 if (*(arg + pos) == '=') {
94 if (parsing_token)
95 parsing_token = false;
96 else
97 goto cleanup;
98 next_starts = true;
99 (*(arg + pos)) = '\0';
100 }
101 if (*(arg + pos) == ',') {
102 parsing_token = true;
103 next_starts = true;
104 (*(arg + pos)) = '\0';
105 }
106 }
107 return result;
108cleanup:
109 printk(UM_KERN_ERR "vector_setup - Couldn't parse '%s'\n", arg);
110 kfree(result);
111 return NULL;
112}
113
/*
 * Socket/FD configuration functions. These return a structure
 * of rx and tx descriptors to cover cases where these are not
 * the same (e.g. read via raw socket and write via tap).
 */
119
120#define PATH_NET_TUN "/dev/net/tun"
121
122
123static int create_tap_fd(char *iface)
124{
125 struct ifreq ifr;
126 int fd = -1;
127 int err = -ENOMEM, offload;
128
129 fd = open(PATH_NET_TUN, O_RDWR);
130 if (fd < 0) {
131 printk(UM_KERN_ERR "uml_tap: failed to open tun device\n");
132 goto tap_fd_cleanup;
133 }
134 memset(&ifr, 0, sizeof(ifr));
135 ifr.ifr_flags = IFF_TAP | IFF_NO_PI | IFF_VNET_HDR;
136 strncpy((char *)&ifr.ifr_name, iface, sizeof(ifr.ifr_name) - 1);
137
138 err = ioctl(fd, TUNSETIFF, (void *) &ifr);
139 if (err != 0) {
140 printk(UM_KERN_ERR "uml_tap: failed to select tap interface\n");
141 goto tap_fd_cleanup;
142 }
143
144 offload = TUN_F_CSUM | TUN_F_TSO4 | TUN_F_TSO6;
145 ioctl(fd, TUNSETOFFLOAD, offload);
146 return fd;
147tap_fd_cleanup:
148 if (fd >= 0)
149 os_close_file(fd);
150 return err;
151}
152
153static int create_raw_fd(char *iface, int flags, int proto)
154{
155 struct ifreq ifr;
156 int fd = -1;
157 struct sockaddr_ll sock;
158 int err = -ENOMEM;
159
160 fd = socket(AF_PACKET, SOCK_RAW, flags);
161 if (fd == -1) {
162 err = -errno;
163 goto raw_fd_cleanup;
164 }
165 memset(&ifr, 0, sizeof(ifr));
166 strncpy((char *)&ifr.ifr_name, iface, sizeof(ifr.ifr_name) - 1);
167 if (ioctl(fd, SIOCGIFINDEX, (void *) &ifr) < 0) {
168 err = -errno;
169 goto raw_fd_cleanup;
170 }
171
172 sock.sll_family = AF_PACKET;
173 sock.sll_protocol = htons(proto);
174 sock.sll_ifindex = ifr.ifr_ifindex;
175
176 if (bind(fd,
177 (struct sockaddr *) &sock, sizeof(struct sockaddr_ll)) < 0) {
178 err = -errno;
179 goto raw_fd_cleanup;
180 }
181 return fd;
182raw_fd_cleanup:
183 printk(UM_KERN_ERR "user_init_raw: init failed, error %d", err);
184 if (fd >= 0)
185 os_close_file(fd);
186 return err;
187}
188
189static struct vector_fds *user_init_tap_fds(struct arglist *ifspec)
190{
191 int fd = -1;
192 char *iface;
193 struct vector_fds *result = NULL;
194
195 iface = uml_vector_fetch_arg(ifspec, TOKEN_IFNAME);
196 if (iface == NULL) {
197 printk(UM_KERN_ERR "uml_tap: failed to parse interface spec\n");
198 goto tap_cleanup;
199 }
200
201 result = uml_kmalloc(sizeof(struct vector_fds), UM_GFP_KERNEL);
202 if (result == NULL) {
203 printk(UM_KERN_ERR "uml_tap: failed to allocate file descriptors\n");
204 goto tap_cleanup;
205 }
206 result->rx_fd = -1;
207 result->tx_fd = -1;
208 result->remote_addr = NULL;
209 result->remote_addr_size = 0;
210
211 /* TAP */
212
213 fd = create_tap_fd(iface);
214 if (fd < 0) {
215 printk(UM_KERN_ERR "uml_tap: failed to create tun interface\n");
216 goto tap_cleanup;
217 }
218 result->tx_fd = fd;
219 result->rx_fd = fd;
220 return result;
221tap_cleanup:
222 printk(UM_KERN_ERR "user_init_tap: init failed, error %d", fd);
223 if (result != NULL)
224 kfree(result);
225 return NULL;
226}
227
228static struct vector_fds *user_init_hybrid_fds(struct arglist *ifspec)
229{
230 char *iface;
231 struct vector_fds *result = NULL;
232
233 iface = uml_vector_fetch_arg(ifspec, TOKEN_IFNAME);
234 if (iface == NULL) {
235 printk(UM_KERN_ERR "uml_tap: failed to parse interface spec\n");
236 goto hybrid_cleanup;
237 }
238
239 result = uml_kmalloc(sizeof(struct vector_fds), UM_GFP_KERNEL);
240 if (result == NULL) {
241 printk(UM_KERN_ERR "uml_tap: failed to allocate file descriptors\n");
242 goto hybrid_cleanup;
243 }
244 result->rx_fd = -1;
245 result->tx_fd = -1;
246 result->remote_addr = NULL;
247 result->remote_addr_size = 0;
248
249 /* TAP */
250
251 result->tx_fd = create_tap_fd(iface);
252 if (result->tx_fd < 0) {
253 printk(UM_KERN_ERR "uml_tap: failed to create tun interface: %i\n", result->tx_fd);
254 goto hybrid_cleanup;
255 }
256
257 /* RAW */
258
259 result->rx_fd = create_raw_fd(iface, ETH_P_ALL, ETH_P_ALL);
260 if (result->rx_fd == -1) {
261 printk(UM_KERN_ERR
262 "uml_tap: failed to create paired raw socket: %i\n", result->rx_fd);
263 goto hybrid_cleanup;
264 }
265 return result;
266hybrid_cleanup:
267 printk(UM_KERN_ERR "user_init_hybrid: init failed");
268 if (result != NULL)
269 kfree(result);
270 return NULL;
271}
272
273static struct vector_fds *user_init_unix_fds(struct arglist *ifspec, int id)
274{
275 int fd = -1;
276 int socktype;
277 char *src, *dst;
278 struct vector_fds *result = NULL;
279 struct sockaddr_un *local_addr = NULL, *remote_addr = NULL;
280
281 src = uml_vector_fetch_arg(ifspec, "src");
282 dst = uml_vector_fetch_arg(ifspec, "dst");
283 result = uml_kmalloc(sizeof(struct vector_fds), UM_GFP_KERNEL);
284 if (result == NULL) {
285 printk(UM_KERN_ERR "unix open:cannot allocate remote addr");
286 goto unix_cleanup;
287 }
288 remote_addr = uml_kmalloc(sizeof(struct sockaddr_un), UM_GFP_KERNEL);
289 if (remote_addr == NULL) {
290 printk(UM_KERN_ERR "unix open:cannot allocate remote addr");
291 goto unix_cleanup;
292 }
293
294 switch (id) {
295 case ID_BESS:
296 socktype = SOCK_SEQPACKET;
297 if ((src != NULL) && (strlen(src) <= MAX_UN_LEN)) {
298 local_addr = uml_kmalloc(sizeof(struct sockaddr_un), UM_GFP_KERNEL);
299 if (local_addr == NULL) {
300 printk(UM_KERN_ERR "bess open:cannot allocate local addr");
301 goto unix_cleanup;
302 }
303 local_addr->sun_family = AF_UNIX;
304 memcpy(local_addr->sun_path, src, strlen(src) + 1);
305 }
306 if ((dst == NULL) || (strlen(dst) > MAX_UN_LEN))
307 goto unix_cleanup;
308 remote_addr->sun_family = AF_UNIX;
309 memcpy(remote_addr->sun_path, dst, strlen(dst) + 1);
310 break;
311 default:
312 printk(KERN_ERR "Unsupported unix socket type\n");
313 return NULL;
314 }
315
316 fd = socket(AF_UNIX, socktype, 0);
317 if (fd == -1) {
318 printk(UM_KERN_ERR
319 "unix open: could not open socket, error = %d",
320 -errno
321 );
322 goto unix_cleanup;
323 }
324 if (local_addr != NULL) {
325 if (bind(fd, (struct sockaddr *) local_addr, sizeof(struct sockaddr_un))) {
326 printk(UM_KERN_ERR UNIX_BIND_FAIL, errno);
327 goto unix_cleanup;
328 }
329 }
330 switch (id) {
331 case ID_BESS:
332 if (connect(fd, remote_addr, sizeof(struct sockaddr_un)) < 0) {
333 printk(UM_KERN_ERR "bess open:cannot connect to %s %i", remote_addr->sun_path, -errno);
334 goto unix_cleanup;
335 }
336 break;
337 }
338 result->rx_fd = fd;
339 result->tx_fd = fd;
340 result->remote_addr_size = sizeof(struct sockaddr_un);
341 result->remote_addr = remote_addr;
342 return result;
343unix_cleanup:
344 if (fd >= 0)
345 os_close_file(fd);
346 if (remote_addr != NULL)
347 kfree(remote_addr);
348 if (result != NULL)
349 kfree(result);
350 return NULL;
351}
352
353static struct vector_fds *user_init_raw_fds(struct arglist *ifspec)
354{
355 int rxfd = -1, txfd = -1;
356 int err = -ENOMEM;
357 char *iface;
358 struct vector_fds *result = NULL;
359
360 iface = uml_vector_fetch_arg(ifspec, TOKEN_IFNAME);
361 if (iface == NULL)
362 goto raw_cleanup;
363
364 rxfd = create_raw_fd(iface, ETH_P_ALL, ETH_P_ALL);
365 if (rxfd == -1) {
366 err = -errno;
367 goto raw_cleanup;
368 }
369 txfd = create_raw_fd(iface, 0, ETH_P_IP); /* Turn off RX on this fd */
370 if (txfd == -1) {
371 err = -errno;
372 goto raw_cleanup;
373 }
374 result = uml_kmalloc(sizeof(struct vector_fds), UM_GFP_KERNEL);
375 if (result != NULL) {
376 result->rx_fd = rxfd;
377 result->tx_fd = txfd;
378 result->remote_addr = NULL;
379 result->remote_addr_size = 0;
380 }
381 return result;
382raw_cleanup:
383 printk(UM_KERN_ERR "user_init_raw: init failed, error %d", err);
384 if (result != NULL)
385 kfree(result);
386 return NULL;
387}
388
389
/*
 * Set the PACKET_QDISC_BYPASS option on packet socket @fd.
 *
 * Returns true when setsockopt() succeeds, false otherwise.
 */
bool uml_raw_enable_qdisc_bypass(int fd)
{
	int enable = 1;
	int rc;

	rc = setsockopt(fd, SOL_PACKET, PACKET_QDISC_BYPASS,
			&enable, sizeof(enable));
	return rc == 0;
}
401
402bool uml_raw_enable_vnet_headers(int fd)
403{
404 int optval = 1;
405
406 if (setsockopt(fd,
407 SOL_PACKET, PACKET_VNET_HDR,
408 &optval, sizeof(optval)) != 0) {
409 printk(UM_KERN_INFO VNET_HDR_FAIL, fd);
410 return false;
411 }
412 return true;
413}
414bool uml_tap_enable_vnet_headers(int fd)
415{
416 unsigned int features;
417 int len = sizeof(struct virtio_net_hdr);
418
419 if (ioctl(fd, TUNGETFEATURES, &features) == -1) {
420 printk(UM_KERN_INFO TUN_GET_F_FAIL, strerror(errno));
421 return false;
422 }
423 if ((features & IFF_VNET_HDR) == 0) {
424 printk(UM_KERN_INFO "tapraw: No VNET HEADER support");
425 return false;
426 }
427 ioctl(fd, TUNSETVNETHDRSZ, &len);
428 return true;
429}
430
/*
 * Open the socket used by the GRE and L2TPv3 transports.
 *
 * @ifspec supplies "src"/"srcport" (local address to bind), "dst"/
 * "dstport" (remote address stored in the result) and the optional
 * "v6" and "udp" switches, which are enabled by a value > 0.
 * @id selects the protocol: ID_GRE uses a raw IPPROTO_GRE socket,
 * ID_L2TPV3 uses a raw IPPROTO_L2TP socket or, with udp set, a
 * datagram socket.
 *
 * Returns a newly allocated vector_fds whose rx_fd and tx_fd are the
 * same socket and whose remote_addr is a copy of the resolved
 * destination, or NULL on failure. On every failure path after the
 * socket has been opened, the socket is closed.
 */
static struct vector_fds *user_init_socket_fds(struct arglist *ifspec, int id)
{
	int err = -ENOMEM;
	int fd = -1, gairet;
	struct addrinfo hints;
	bool v6 = false, udp = false;
	char *value;
	char *src, *dst, *srcport, *dstport;
	struct addrinfo *gairesult = NULL;
	struct vector_fds *result = NULL;

	value = uml_vector_fetch_arg(ifspec, "v6");
	if (value != NULL) {
		if (strtol((const char *) value, NULL, 10) > 0)
			v6 = true;
	}

	value = uml_vector_fetch_arg(ifspec, "udp");
	if (value != NULL) {
		if (strtol((const char *) value, NULL, 10) > 0)
			udp = true;
	}
	src = uml_vector_fetch_arg(ifspec, "src");
	dst = uml_vector_fetch_arg(ifspec, "dst");
	srcport = uml_vector_fetch_arg(ifspec, "srcport");
	dstport = uml_vector_fetch_arg(ifspec, "dstport");

	/* The same hints are used for the source and destination lookups. */
	memset(&hints, 0, sizeof(hints));

	if (v6)
		hints.ai_family = AF_INET6;
	else
		hints.ai_family = AF_INET;

	switch (id) {
	case ID_GRE:
		hints.ai_socktype = SOCK_RAW;
		hints.ai_protocol = IPPROTO_GRE;
		break;
	case ID_L2TPV3:
		if (udp) {
			hints.ai_socktype = SOCK_DGRAM;
			hints.ai_protocol = 0;
		} else {
			hints.ai_socktype = SOCK_RAW;
			hints.ai_protocol = IPPROTO_L2TP;
		}
		break;
	default:
		printk(UM_KERN_ERR "Unsupported socket type\n");
		return NULL;
	}

	gairet = getaddrinfo(src, srcport, &hints, &gairesult);
	if ((gairet != 0) || (gairesult == NULL)) {
		printk(UM_KERN_ERR
			"socket_open : could not resolve src, error = %s",
			gai_strerror(gairet)
		);
		/* Nothing has been acquired yet. */
		return NULL;
	}
	fd = socket(gairesult->ai_family,
		gairesult->ai_socktype, gairesult->ai_protocol);
	if (fd == -1) {
		err = -errno;
		printk(UM_KERN_ERR
			"socket_open : could not open socket, error = %d",
			err
		);
		goto cleanup;
	}
	if (bind(fd,
		(struct sockaddr *) gairesult->ai_addr,
		gairesult->ai_addrlen)) {
		err = -errno;
		printk(UM_KERN_ERR L2TPV3_BIND_FAIL, -err);
		goto cleanup;
	}

	freeaddrinfo(gairesult);
	gairesult = NULL;

	gairet = getaddrinfo(dst, dstport, &hints, &gairesult);
	if ((gairet != 0) || (gairesult == NULL)) {
		err = -EINVAL;
		printk(UM_KERN_ERR
			"socket_open : could not resolve dst, error = %s",
			gai_strerror(gairet)
		);
		/* The bound socket must not leak. */
		goto cleanup;
	}

	result = uml_kmalloc(sizeof(struct vector_fds), UM_GFP_KERNEL);
	if (result == NULL)
		goto cleanup;	/* err is still -ENOMEM here */

	result->rx_fd = fd;
	result->tx_fd = fd;
	result->remote_addr = uml_kmalloc(
		gairesult->ai_addrlen, UM_GFP_KERNEL);
	if (result->remote_addr == NULL)
		goto cleanup;
	result->remote_addr_size = gairesult->ai_addrlen;
	memcpy(
		result->remote_addr,
		gairesult->ai_addr,
		gairesult->ai_addrlen
	);
	freeaddrinfo(gairesult);
	return result;
cleanup:
	if (gairesult != NULL)
		freeaddrinfo(gairesult);
	printk(UM_KERN_ERR "user_init_socket: init failed, error %d", err);
	if (fd >= 0)
		os_close_file(fd);
	if (result != NULL) {
		kfree(result->remote_addr);
		kfree(result);
	}
	return NULL;
}
556
557struct vector_fds *uml_vector_user_open(
558 int unit,
559 struct arglist *parsed
560)
561{
562 char *transport;
563
564 if (parsed == NULL) {
565 printk(UM_KERN_ERR "no parsed config for unit %d\n", unit);
566 return NULL;
567 }
568 transport = uml_vector_fetch_arg(parsed, "transport");
569 if (transport == NULL) {
570 printk(UM_KERN_ERR "missing transport for unit %d\n", unit);
571 return NULL;
572 }
573 if (strncmp(transport, TRANS_RAW, TRANS_RAW_LEN) == 0)
574 return user_init_raw_fds(parsed);
575 if (strncmp(transport, TRANS_HYBRID, TRANS_HYBRID_LEN) == 0)
576 return user_init_hybrid_fds(parsed);
577 if (strncmp(transport, TRANS_TAP, TRANS_TAP_LEN) == 0)
578 return user_init_tap_fds(parsed);
579 if (strncmp(transport, TRANS_GRE, TRANS_GRE_LEN) == 0)
580 return user_init_socket_fds(parsed, ID_GRE);
581 if (strncmp(transport, TRANS_L2TPV3, TRANS_L2TPV3_LEN) == 0)
582 return user_init_socket_fds(parsed, ID_L2TPV3);
583 if (strncmp(transport, TRANS_BESS, TRANS_BESS_LEN) == 0)
584 return user_init_unix_fds(parsed, ID_BESS);
585 return NULL;
586}
587
588
/*
 * sendmsg() wrapper: @hdr is a struct msghdr passed as void *.
 *
 * Returns the non-negative sendmsg() result, 0 when the call failed
 * with EAGAIN, and -errno for any other failure.
 */
int uml_vector_sendmsg(int fd, void *hdr, int flags)
{
	struct msghdr *msg = hdr;
	int sent;

	CATCH_EINTR(sent = sendmsg(fd, msg, flags));
	if (sent >= 0)
		return sent;

	return (errno == EAGAIN) ? 0 : -errno;
}
601
/*
 * Receive into the I/O vector described by @hdr (a struct msghdr passed
 * as void *).
 *
 * The data is read with readv() on the header's msg_iov/msg_iovlen;
 * @flags is not used. Returns the non-negative readv() result, 0 when
 * the call failed with EAGAIN, and -errno for any other failure.
 */
int uml_vector_recvmsg(int fd, void *hdr, int flags)
{
	struct msghdr *header = hdr;
	int received;

	CATCH_EINTR(received = readv(fd, header->msg_iov, header->msg_iovlen));
	if (received >= 0)
		return received;

	return (errno == EAGAIN) ? 0 : -errno;
}
615
/*
 * writev() wrapper: @hdr is an array of @iovcount struct iovec entries
 * passed as void *.
 *
 * Returns the non-negative writev() result, 0 when the call failed with
 * EAGAIN or ENOBUFS, and -errno for any other failure.
 */
int uml_vector_writev(int fd, void *hdr, int iovcount)
{
	struct iovec *iov = hdr;
	int written;

	CATCH_EINTR(written = writev(fd, iov, iovcount));
	if (written >= 0)
		return written;

	if (errno == EAGAIN || errno == ENOBUFS)
		return 0;
	return -errno;
}
628
/*
 * sendmmsg() wrapper: @msgvec is an array of @vlen struct mmsghdr
 * entries passed as void *.
 *
 * Returns the non-negative sendmmsg() result, 0 when the call failed
 * with EAGAIN or ENOBUFS, and -errno for any other failure.
 */
int uml_vector_sendmmsg(
	int fd,
	void *msgvec,
	unsigned int vlen,
	unsigned int flags)
{
	struct mmsghdr *msgs = msgvec;
	int sent;

	CATCH_EINTR(sent = sendmmsg(fd, msgs, vlen, flags));
	if (sent >= 0)
		return sent;

	if (errno == EAGAIN || errno == ENOBUFS)
		return 0;
	return -errno;
}
645
/*
 * recvmmsg() wrapper: @msgvec is an array of @vlen struct mmsghdr
 * entries passed as void *. No timeout is supplied.
 *
 * Returns the non-negative recvmmsg() result, 0 when the call failed
 * with EAGAIN, and -errno for any other failure.
 */
int uml_vector_recvmmsg(
	int fd,
	void *msgvec,
	unsigned int vlen,
	unsigned int flags)
{
	struct mmsghdr *msgs = msgvec;
	int received;

	CATCH_EINTR(received = recvmmsg(fd, msgs, vlen, flags, 0));
	if (received >= 0)
		return received;

	return (errno == EAGAIN) ? 0 : -errno;
}
663int uml_vector_attach_bpf(int fd, void *bpf, int bpf_len)
664{
665 int err = setsockopt(fd, SOL_SOCKET, SO_ATTACH_FILTER, bpf, bpf_len);
666
667 if (err < 0)
668 printk(KERN_ERR BPF_ATTACH_FAIL, bpf_len, fd, -errno);
669 return err;
670}
671
672#define DEFAULT_BPF_LEN 6
673
674void *uml_vector_default_bpf(int fd, void *mac)
675{
676 struct sock_filter *bpf;
677 uint32_t *mac1 = (uint32_t *)(mac + 2);
678 uint16_t *mac2 = (uint16_t *) mac;
679 struct sock_fprog bpf_prog = {
680 .len = 6,
681 .filter = NULL,
682 };
683
684 bpf = uml_kmalloc(
685 sizeof(struct sock_filter) * DEFAULT_BPF_LEN, UM_GFP_KERNEL);
686 if (bpf != NULL) {
687 bpf_prog.filter = bpf;
688 /* ld [8] */
689 bpf[0] = (struct sock_filter){ 0x20, 0, 0, 0x00000008 };
690 /* jeq #0xMAC[2-6] jt 2 jf 5*/
691 bpf[1] = (struct sock_filter){ 0x15, 0, 3, ntohl(*mac1)};
692 /* ldh [6] */
693 bpf[2] = (struct sock_filter){ 0x28, 0, 0, 0x00000006 };
694 /* jeq #0xMAC[0-1] jt 4 jf 5 */
695 bpf[3] = (struct sock_filter){ 0x15, 0, 1, ntohs(*mac2)};
696 /* ret #0 */
697 bpf[4] = (struct sock_filter){ 0x6, 0, 0, 0x00000000 };
698 /* ret #0x40000 */
699 bpf[5] = (struct sock_filter){ 0x6, 0, 0, 0x00040000 };
700 if (uml_vector_attach_bpf(
701 fd, &bpf_prog, sizeof(struct sock_fprog)) < 0) {
702 kfree(bpf);
703 bpf = NULL;
704 }
705 }
706 return bpf;
707}
708