blob: a2a92356c1a017ae0270e4d4ee8c8b665969c788 [file] [log] [blame]
Mark McLoughlin966ea5e2009-10-22 17:49:09 +01001/*
2 * QEMU System Emulator
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24
Peter Maydell2744d922016-01-29 17:50:00 +000025#include "qemu/osdep.h"
Markus Armbrusterda34e652016-03-14 09:01:28 +010026#include "qapi/error.h"
Paolo Bonzini1422e322012-10-24 08:43:34 +020027#include "tap_int.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010028#include "sysemu/sysemu.h"
Veronia Bahaaf348b6d2016-03-20 19:16:19 +020029#include "qemu/cutils.h"
Mark McLoughlin966ea5e2009-10-22 17:49:09 +010030
Mark McLoughlin966ea5e2009-10-22 17:49:09 +010031#include <sys/ethernet.h>
32#include <sys/sockio.h>
33#include <netinet/arp.h>
34#include <netinet/in.h>
35#include <netinet/in_systm.h>
36#include <netinet/ip.h>
37#include <netinet/ip_icmp.h> // must come after ip.h
38#include <netinet/udp.h>
39#include <netinet/tcp.h>
40#include <net/if.h>
Mark McLoughlin966ea5e2009-10-22 17:49:09 +010041#include <stropts.h>
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010042#include "qemu/error-report.h"
Mark McLoughlin966ea5e2009-10-22 17:49:09 +010043
/*
 * Fetch the data part of the next STREAMS message on @tapfd into @buf.
 *
 * @maxlen is handed to getmsg() as the capacity of @buf.  No control part
 * is requested, and the flags word starts out as 0.
 *
 * Returns the data length reported by getmsg(), or -1 if getmsg() fails.
 */
ssize_t tap_read_packet(int tapfd, uint8_t *buf, int maxlen)
{
    int flags = 0;
    struct strbuf data;

    data.buf = (char *)buf;
    data.maxlen = maxlen;

    if (getmsg(tapfd, NULL, &data, &flags) < 0) {
        return -1;
    }
    return data.len;
}
54
#define TUNNEWPPA (('T'<<16) | 0x0001)
/*
 * Allocate a TAP device and return its opened fd.
 *
 * @dev:      in/out device name.  On entry, if non-empty, the number found
 *            after skipping leading non-digit characters is passed to the
 *            driver as the requested unit number (PPA).  On success it is
 *            overwritten with "tap<ppa>", bounded by @dev_size.
 * @dev_size: size of the buffer behind @dev (must be large enough).
 * @errp:     set on the failures that abort the allocation.
 *
 * Returns the TAP fd on success, or -1 with @errp set on failure.  On the
 * failure paths every descriptor opened by this call for the TAP device
 * itself is closed again.  ip_fd is kept in a static and is closed at the
 * start of the next call.
 */
static int tap_alloc(char *dev, size_t dev_size, Error **errp)
{
    /* FIXME suspicious: many errors are reported, then ignored */
    int tap_fd = -1, if_fd = -1, ppa = -1;
    static int ip_fd = 0;
    static int arp_fd = 0;
    char *ptr;
    int ip_muxid, arp_muxid;
    struct strioctl strioc_if, strioc_ppa;
    int link_type = I_PLINK;
    struct lifreq ifr;
    char actual_name[32] = "";

    memset(&ifr, 0x0, sizeof(ifr));

    /* Skip to the first digit of the supplied name and parse from there. */
    if (*dev) {
        ptr = dev;
        while (*ptr && !qemu_isdigit((int)*ptr)) {
            ptr++;
        }
        ppa = atoi(ptr);
    }

    /* Check if IP device was opened */
    if (ip_fd) {
        close(ip_fd);
    }

    TFR(ip_fd = open("/dev/udp", O_RDWR, 0));
    if (ip_fd < 0) {
        error_setg(errp, "Can't open /dev/ip (actually /dev/udp)");
        return -1;
    }

    TFR(tap_fd = open("/dev/tap", O_RDWR, 0));
    if (tap_fd < 0) {
        error_setg(errp, "Can't open /dev/tap");
        return -1;
    }

    /* Assign a new PPA and get its unit number. */
    strioc_ppa.ic_cmd = TUNNEWPPA;
    strioc_ppa.ic_timout = 0;
    strioc_ppa.ic_len = sizeof(ppa);
    strioc_ppa.ic_dp = (char *)&ppa;
    if ((ppa = ioctl(tap_fd, I_STR, &strioc_ppa)) < 0) {
        error_report("Can't assign new interface");
    }

    TFR(if_fd = open("/dev/tap", O_RDWR, 0));
    if (if_fd < 0) {
        error_setg(errp, "Can't open /dev/tap (2)");
        goto fail;
    }
    if (ioctl(if_fd, I_PUSH, "ip") < 0) {
        error_setg(errp, "Can't push IP module");
        goto fail;
    }

    if (ioctl(if_fd, SIOCGLIFFLAGS, &ifr) < 0) {
        error_report("Can't get flags");
    }

    snprintf(actual_name, sizeof(actual_name), "tap%d", ppa);
    pstrcpy(ifr.lifr_name, sizeof(ifr.lifr_name), actual_name);

    /* Assign ppa according to the unit number returned by tun device */
    ifr.lifr_ppa = ppa;

    if (ioctl(if_fd, SIOCSLIFNAME, &ifr) < 0) {
        error_report("Can't set PPA %d", ppa);
    }
    if (ioctl(if_fd, SIOCGLIFFLAGS, &ifr) < 0) {
        error_report("Can't get flags");
    }
    /* Push arp module to if_fd */
    if (ioctl(if_fd, I_PUSH, "arp") < 0) {
        error_report("Can't push ARP module (2)");
    }

    /* Push arp module to ip_fd */
    if (ioctl(ip_fd, I_POP, NULL) < 0) {
        error_report("I_POP failed");
    }
    if (ioctl(ip_fd, I_PUSH, "arp") < 0) {
        error_report("Can't push ARP module (3)");
    }
    /* Open arp_fd */
    TFR(arp_fd = open("/dev/tap", O_RDWR, 0));
    if (arp_fd < 0) {
        error_report("Can't open %s", "/dev/tap");
    }

    /* Set ifname to arp */
    strioc_if.ic_cmd = SIOCSLIFNAME;
    strioc_if.ic_timout = 0;
    strioc_if.ic_len = sizeof(ifr);
    strioc_if.ic_dp = (char *)&ifr;
    if (ioctl(arp_fd, I_STR, &strioc_if) < 0) {
        error_report("Can't set ifname to arp");
    }

    if ((ip_muxid = ioctl(ip_fd, I_LINK, if_fd)) < 0) {
        error_setg(errp, "Can't link TAP device to IP");
        /* arp_fd was opened by this call and has not been linked yet. */
        if (arp_fd >= 0) {
            close(arp_fd);
            arp_fd = -1;
        }
        goto fail;
    }

    if ((arp_muxid = ioctl(ip_fd, link_type, arp_fd)) < 0) {
        error_report("Can't link TAP device to ARP");
    }

    close(if_fd);

    memset(&ifr, 0x0, sizeof(ifr));
    pstrcpy(ifr.lifr_name, sizeof(ifr.lifr_name), actual_name);
    ifr.lifr_ip_muxid = ip_muxid;
    ifr.lifr_arp_muxid = arp_muxid;

    if (ioctl(ip_fd, SIOCSLIFMUXID, &ifr) < 0) {
        ioctl(ip_fd, I_PUNLINK, arp_muxid);
        ioctl(ip_fd, I_PUNLINK, ip_muxid);
        error_report("Can't set multiplexor id");
    }

    snprintf(dev, dev_size, "tap%d", ppa);
    return tap_fd;

fail:
    /* Release the per-call descriptors so a failed allocation leaks nothing. */
    if (if_fd >= 0) {
        close(if_fd);
    }
    if (tap_fd >= 0) {
        close(tap_fd);
    }
    return -1;
}
178
Jason Wang264986e2013-01-30 19:12:34 +0800179int tap_open(char *ifname, int ifname_size, int *vnet_hdr,
Markus Armbruster468dd822015-05-15 13:58:58 +0200180 int vnet_hdr_required, int mq_required, Error **errp)
Mark McLoughlin966ea5e2009-10-22 17:49:09 +0100181{
182 char dev[10]="";
183 int fd;
Markus Armbruster576c6eb2015-05-15 13:59:01 +0200184
185 fd = tap_alloc(dev, sizeof(dev), errp);
186 if (fd < 0) {
187 return -1;
Mark McLoughlin966ea5e2009-10-22 17:49:09 +0100188 }
189 pstrcpy(ifname, ifname_size, dev);
Mark McLoughlinf5c5e382009-11-25 18:49:37 +0000190 if (*vnet_hdr) {
191 /* Solaris doesn't have IFF_VNET_HDR */
192 *vnet_hdr = 0;
193
194 if (vnet_hdr_required && !*vnet_hdr) {
Markus Armbruster576c6eb2015-05-15 13:59:01 +0200195 error_setg(errp, "vnet_hdr=1 requested, but no kernel "
196 "support for IFF_VNET_HDR available");
Mark McLoughlinf5c5e382009-11-25 18:49:37 +0000197 close(fd);
198 return -1;
199 }
200 }
Mark McLoughlin966ea5e2009-10-22 17:49:09 +0100201 fcntl(fd, F_SETFL, O_NONBLOCK);
202 return fd;
203}
Mark McLoughlin15ac9132009-10-22 17:49:13 +0100204
Markus Armbruster80b832c2015-05-15 13:58:55 +0200205void tap_set_sndbuf(int fd, const NetdevTapOptions *tap, Error **errp)
Mark McLoughlin15ac9132009-10-22 17:49:13 +0100206{
Mark McLoughlin15ac9132009-10-22 17:49:13 +0100207}
Mark McLoughlindc690042009-10-22 17:49:14 +0100208
/*
 * Probe @fd for vnet header support.
 * This implementation never inspects @fd and always returns 0.
 */
int tap_probe_vnet_hdr(int fd)
{
    (void)fd;
    return 0;
}
Mark McLoughlin1faac1f2009-10-22 17:49:15 +0100213
/*
 * Probe @fd for UFO support.
 * This implementation never inspects @fd and always returns 0.
 */
int tap_probe_has_ufo(int fd)
{
    (void)fd;
    return 0;
}
218
/*
 * Probe whether @fd accepts a vnet header of @len bytes.
 * This implementation ignores both arguments and always returns 0.
 */
int tap_probe_vnet_hdr_len(int fd, int len)
{
    (void)fd;
    (void)len;
    return 0;
}
223
/*
 * Set the vnet header length on @fd.
 * This implementation does nothing; both arguments are ignored.
 */
void tap_fd_set_vnet_hdr_len(int fd, int len)
{
    (void)fd;
    (void)len;
}
227
/*
 * Request little-endian vnet headers on @fd.
 * This implementation ignores both arguments and always returns -EINVAL.
 */
int tap_fd_set_vnet_le(int fd, int is_le)
{
    (void)fd;
    (void)is_le;
    return -EINVAL;
}
232
/*
 * Request big-endian vnet headers on @fd.
 * This implementation ignores both arguments and always returns -EINVAL.
 */
int tap_fd_set_vnet_be(int fd, int is_be)
{
    (void)fd;
    (void)is_be;
    return -EINVAL;
}
237
/*
 * Configure offload features (checksum, TSO4, TSO6, ECN, UFO) on @fd.
 * This implementation does nothing; every argument is ignored.
 */
void tap_fd_set_offload(int fd, int csum, int tso4,
                        int tso6, int ecn, int ufo)
{
    (void)fd;
    (void)csum;
    (void)tso4;
    (void)tso6;
    (void)ecn;
    (void)ufo;
}
Jason Wang94fdc6d2013-01-30 19:12:31 +0800242
/*
 * Enable the queue behind @fd.
 * This implementation never touches @fd and always returns -1.
 */
int tap_fd_enable(int fd)
{
    (void)fd;
    return -1;
}
247
/*
 * Disable the queue behind @fd.
 * This implementation never touches @fd and always returns -1.
 */
int tap_fd_disable(int fd)
{
    (void)fd;
    return -1;
}
252
/*
 * Look up the interface name for @fd.
 * This implementation always returns -1 and leaves @ifname untouched.
 */
int tap_fd_get_ifname(int fd, char *ifname)
{
    (void)fd;
    (void)ifname;
    return -1;
}