Statistics
| Branch: | Revision:

root / net / tap.c @ 9bf0960a

History | View | Annotate | Download (13.5 kB)

1 5281d757 Mark McLoughlin
/*
2 5281d757 Mark McLoughlin
 * QEMU System Emulator
3 5281d757 Mark McLoughlin
 *
4 5281d757 Mark McLoughlin
 * Copyright (c) 2003-2008 Fabrice Bellard
5 5281d757 Mark McLoughlin
 * Copyright (c) 2009 Red Hat, Inc.
6 5281d757 Mark McLoughlin
 *
7 5281d757 Mark McLoughlin
 * Permission is hereby granted, free of charge, to any person obtaining a copy
8 5281d757 Mark McLoughlin
 * of this software and associated documentation files (the "Software"), to deal
9 5281d757 Mark McLoughlin
 * in the Software without restriction, including without limitation the rights
10 5281d757 Mark McLoughlin
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
11 5281d757 Mark McLoughlin
 * copies of the Software, and to permit persons to whom the Software is
12 5281d757 Mark McLoughlin
 * furnished to do so, subject to the following conditions:
13 5281d757 Mark McLoughlin
 *
14 5281d757 Mark McLoughlin
 * The above copyright notice and this permission notice shall be included in
15 5281d757 Mark McLoughlin
 * all copies or substantial portions of the Software.
16 5281d757 Mark McLoughlin
 *
17 5281d757 Mark McLoughlin
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 5281d757 Mark McLoughlin
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 5281d757 Mark McLoughlin
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 5281d757 Mark McLoughlin
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 5281d757 Mark McLoughlin
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22 5281d757 Mark McLoughlin
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
23 5281d757 Mark McLoughlin
 * THE SOFTWARE.
24 5281d757 Mark McLoughlin
 */
25 5281d757 Mark McLoughlin
26 5281d757 Mark McLoughlin
#include "net/tap.h"
27 5281d757 Mark McLoughlin
28 5281d757 Mark McLoughlin
#include "config-host.h"
29 5281d757 Mark McLoughlin
30 5281d757 Mark McLoughlin
#include <sys/ioctl.h>
31 5281d757 Mark McLoughlin
#include <sys/stat.h>
32 5281d757 Mark McLoughlin
#include <sys/wait.h>
33 71f4effc Alexander Graf
#include <sys/socket.h>
34 5281d757 Mark McLoughlin
#include <net/if.h>
35 5281d757 Mark McLoughlin
36 5281d757 Mark McLoughlin
#include "net.h"
37 5281d757 Mark McLoughlin
#include "sysemu.h"
38 5281d757 Mark McLoughlin
#include "qemu-char.h"
39 5281d757 Mark McLoughlin
#include "qemu-common.h"
40 2f792016 Markus Armbruster
#include "qemu-error.h"
41 5281d757 Mark McLoughlin
42 5281d757 Mark McLoughlin
#include "net/tap-linux.h"
43 5281d757 Mark McLoughlin
44 82b0d80e Michael S. Tsirkin
#include "hw/vhost_net.h"
45 82b0d80e Michael S. Tsirkin
46 5281d757 Mark McLoughlin
/*
 * Size of the per-device packet buffer: the largest GSO packet (64k)
 * plus generous headroom for the ethernet and virtio_net headers.
 */
#define TAP_BUFSIZE (65536 + 4096)
50 5281d757 Mark McLoughlin
51 5281d757 Mark McLoughlin
typedef struct TAPState {
52 3e35ba93 Mark McLoughlin
    VLANClientState nc;
53 5281d757 Mark McLoughlin
    int fd;
54 5281d757 Mark McLoughlin
    char down_script[1024];
55 5281d757 Mark McLoughlin
    char down_script_arg[128];
56 5281d757 Mark McLoughlin
    uint8_t buf[TAP_BUFSIZE];
57 5281d757 Mark McLoughlin
    unsigned int read_poll : 1;
58 5281d757 Mark McLoughlin
    unsigned int write_poll : 1;
59 5281d757 Mark McLoughlin
    unsigned int using_vnet_hdr : 1;
60 5281d757 Mark McLoughlin
    unsigned int has_ufo: 1;
61 82b0d80e Michael S. Tsirkin
    VHostNetState *vhost_net;
62 ef4252b1 Michael S. Tsirkin
    unsigned host_vnet_hdr_len;
63 5281d757 Mark McLoughlin
} TAPState;
64 5281d757 Mark McLoughlin
65 5281d757 Mark McLoughlin
static int launch_script(const char *setup_script, const char *ifname, int fd);
66 5281d757 Mark McLoughlin
67 5281d757 Mark McLoughlin
static int tap_can_send(void *opaque);
68 5281d757 Mark McLoughlin
static void tap_send(void *opaque);
69 5281d757 Mark McLoughlin
static void tap_writable(void *opaque);
70 5281d757 Mark McLoughlin
71 5281d757 Mark McLoughlin
/*
 * Register the fd callbacks that correspond to the current read_poll and
 * write_poll flags.  A cleared flag results in NULL being passed for the
 * matching callback(s).
 */
static void tap_update_fd_handler(TAPState *s)
{
    int (*can_read)(void *) = NULL;
    void (*on_read)(void *) = NULL;
    void (*on_write)(void *) = NULL;

    if (s->read_poll) {
        can_read = tap_can_send;
        on_read = tap_send;
    }
    if (s->write_poll) {
        on_write = tap_writable;
    }

    qemu_set_fd_handler2(s->fd, can_read, on_read, on_write, s);
}
79 5281d757 Mark McLoughlin
80 5281d757 Mark McLoughlin
/* Turn read polling on (enable != 0) or off and refresh the fd callbacks. */
static void tap_read_poll(TAPState *s, int enable)
{
    s->read_poll = enable ? 1 : 0;
    tap_update_fd_handler(s);
}
85 5281d757 Mark McLoughlin
86 5281d757 Mark McLoughlin
/* Turn write polling on (enable != 0) or off and refresh the fd callbacks. */
static void tap_write_poll(TAPState *s, int enable)
{
    s->write_poll = (enable != 0);
    tap_update_fd_handler(s);
}
91 5281d757 Mark McLoughlin
92 5281d757 Mark McLoughlin
static void tap_writable(void *opaque)
93 5281d757 Mark McLoughlin
{
94 5281d757 Mark McLoughlin
    TAPState *s = opaque;
95 5281d757 Mark McLoughlin
96 5281d757 Mark McLoughlin
    tap_write_poll(s, 0);
97 5281d757 Mark McLoughlin
98 3e35ba93 Mark McLoughlin
    qemu_flush_queued_packets(&s->nc);
99 5281d757 Mark McLoughlin
}
100 5281d757 Mark McLoughlin
101 5281d757 Mark McLoughlin
/*
 * Write one packet, described by iov[0..iovcnt), to the tap fd.
 *
 * The write is retried while it is interrupted (EINTR).  If it would
 * block (EAGAIN), write polling is enabled and 0 is returned; in every
 * other case the result of writev() is returned unchanged.
 */
static ssize_t tap_write_packet(TAPState *s, const struct iovec *iov, int iovcnt)
{
    ssize_t written;

    for (;;) {
        written = writev(s->fd, iov, iovcnt);
        if (written != -1 || errno != EINTR) {
            break;
        }
    }

    if (written != -1 || errno != EAGAIN) {
        return written;
    }

    tap_write_poll(s, 1);
    return 0;
}
116 5281d757 Mark McLoughlin
117 3e35ba93 Mark McLoughlin
/*
 * receive_iov hook: write a scattered packet to the tap fd.
 *
 * When the fd carries a vnet header but the header is not in use
 * (using_vnet_hdr clear), an all-zero header of host_vnet_hdr_len bytes
 * is placed in front of the caller's vector before writing.
 */
static ssize_t tap_receive_iov(VLANClientState *nc, const struct iovec *iov,
                               int iovcnt)
{
    TAPState *s = DO_UPCAST(TAPState, nc, nc);
    struct virtio_net_hdr_mrg_rxbuf zero_hdr = { };
    struct iovec with_hdr[iovcnt + 1];

    if (!s->host_vnet_hdr_len || s->using_vnet_hdr) {
        return tap_write_packet(s, iov, iovcnt);
    }

    with_hdr[0].iov_base = &zero_hdr;
    with_hdr[0].iov_len = s->host_vnet_hdr_len;
    memcpy(with_hdr + 1, iov, iovcnt * sizeof(*iov));

    return tap_write_packet(s, with_hdr, iovcnt + 1);
}
135 5281d757 Mark McLoughlin
136 3e35ba93 Mark McLoughlin
/*
 * receive_raw hook: write a linear packet to the tap fd, preceded by an
 * all-zero vnet header whenever the fd carries one (host_vnet_hdr_len
 * non-zero).
 */
static ssize_t tap_receive_raw(VLANClientState *nc, const uint8_t *buf, size_t size)
{
    TAPState *s = DO_UPCAST(TAPState, nc, nc);
    struct virtio_net_hdr_mrg_rxbuf zero_hdr = { };
    struct iovec iov[2];
    struct iovec *payload = iov;

    if (s->host_vnet_hdr_len) {
        iov[0].iov_base = &zero_hdr;
        iov[0].iov_len = s->host_vnet_hdr_len;
        payload++;
    }

    payload->iov_base = (char *)buf;
    payload->iov_len = size;

    return tap_write_packet(s, iov, (int)(payload - iov) + 1);
}
155 5281d757 Mark McLoughlin
156 3e35ba93 Mark McLoughlin
/*
 * receive hook: write a linear packet to the tap fd.  If the fd carries a
 * vnet header that is not in use, the work is handed to tap_receive_raw(),
 * which prepends a zeroed header; otherwise the buffer is written as is.
 */
static ssize_t tap_receive(VLANClientState *nc, const uint8_t *buf, size_t size)
{
    TAPState *s = DO_UPCAST(TAPState, nc, nc);
    struct iovec whole;

    if (s->host_vnet_hdr_len && !s->using_vnet_hdr) {
        return tap_receive_raw(nc, buf, size);
    }

    whole.iov_base = (char *)buf;
    whole.iov_len = size;

    return tap_write_packet(s, &whole, 1);
}
170 5281d757 Mark McLoughlin
171 5281d757 Mark McLoughlin
static int tap_can_send(void *opaque)
172 5281d757 Mark McLoughlin
{
173 5281d757 Mark McLoughlin
    TAPState *s = opaque;
174 5281d757 Mark McLoughlin
175 3e35ba93 Mark McLoughlin
    return qemu_can_send_packet(&s->nc);
176 5281d757 Mark McLoughlin
}
177 5281d757 Mark McLoughlin
178 966ea5ec Mark McLoughlin
#ifndef __sun__
179 966ea5ec Mark McLoughlin
/*
 * Read up to maxlen bytes from tapfd into buf with a single read() call
 * and return its result.
 */
ssize_t tap_read_packet(int tapfd, uint8_t *buf, int maxlen)
{
    ssize_t nread = read(tapfd, buf, maxlen);

    return nread;
}
183 5281d757 Mark McLoughlin
#endif
184 5281d757 Mark McLoughlin
185 3e35ba93 Mark McLoughlin
/*
 * Completion callback handed to qemu_send_packet_async() by tap_send():
 * turns read polling back on.  The len argument is not used.
 */
static void tap_send_completed(VLANClientState *nc, ssize_t len)
{
    tap_read_poll(DO_UPCAST(TAPState, nc, nc), 1);
}
190 5281d757 Mark McLoughlin
191 5281d757 Mark McLoughlin
static void tap_send(void *opaque)
192 5281d757 Mark McLoughlin
{
193 5281d757 Mark McLoughlin
    TAPState *s = opaque;
194 5281d757 Mark McLoughlin
    int size;
195 5281d757 Mark McLoughlin
196 5819c918 Mark McLoughlin
    do {
197 5819c918 Mark McLoughlin
        uint8_t *buf = s->buf;
198 5819c918 Mark McLoughlin
199 5819c918 Mark McLoughlin
        size = tap_read_packet(s->fd, s->buf, sizeof(s->buf));
200 5819c918 Mark McLoughlin
        if (size <= 0) {
201 5819c918 Mark McLoughlin
            break;
202 5819c918 Mark McLoughlin
        }
203 5819c918 Mark McLoughlin
204 ef4252b1 Michael S. Tsirkin
        if (s->host_vnet_hdr_len && !s->using_vnet_hdr) {
205 ef4252b1 Michael S. Tsirkin
            buf  += s->host_vnet_hdr_len;
206 ef4252b1 Michael S. Tsirkin
            size -= s->host_vnet_hdr_len;
207 5819c918 Mark McLoughlin
        }
208 5819c918 Mark McLoughlin
209 3e35ba93 Mark McLoughlin
        size = qemu_send_packet_async(&s->nc, buf, size, tap_send_completed);
210 5819c918 Mark McLoughlin
        if (size == 0) {
211 5819c918 Mark McLoughlin
            tap_read_poll(s, 0);
212 5819c918 Mark McLoughlin
        }
213 3e35ba93 Mark McLoughlin
    } while (size > 0 && qemu_can_send_packet(&s->nc));
214 5281d757 Mark McLoughlin
}
215 5281d757 Mark McLoughlin
216 3e35ba93 Mark McLoughlin
/*
 * Return the has_ufo flag recorded for this tap client.
 * nc must be a tap client (asserted).
 */
int tap_has_ufo(VLANClientState *nc)
{
    TAPState *tap;

    assert(nc->info->type == NET_CLIENT_TYPE_TAP);
    tap = DO_UPCAST(TAPState, nc, nc);

    return tap->has_ufo;
}
224 5281d757 Mark McLoughlin
225 3e35ba93 Mark McLoughlin
/*
 * Return 1 if a vnet header length is recorded for this tap client
 * (host_vnet_hdr_len non-zero), 0 otherwise.
 * nc must be a tap client (asserted).
 */
int tap_has_vnet_hdr(VLANClientState *nc)
{
    TAPState *tap;

    assert(nc->info->type == NET_CLIENT_TYPE_TAP);
    tap = DO_UPCAST(TAPState, nc, nc);

    return tap->host_vnet_hdr_len != 0;
}
233 5281d757 Mark McLoughlin
234 445d892f Michael S. Tsirkin
/*
 * Return the result of tap_probe_vnet_hdr_len() for this client's fd and
 * the given header length.  nc must be a tap client (asserted).
 */
int tap_has_vnet_hdr_len(VLANClientState *nc, int len)
{
    TAPState *tap;

    assert(nc->info->type == NET_CLIENT_TYPE_TAP);
    tap = DO_UPCAST(TAPState, nc, nc);

    return tap_probe_vnet_hdr_len(tap->fd, len);
}
242 445d892f Michael S. Tsirkin
243 445d892f Michael S. Tsirkin
/*
 * Set the vnet header length on the tap fd and record it in the state.
 *
 * nc must be a tap client, and len must be the size of either
 * struct virtio_net_hdr or struct virtio_net_hdr_mrg_rxbuf (both asserted).
 */
void tap_set_vnet_hdr_len(VLANClientState *nc, int len)
{
    TAPState *tap;

    assert(nc->info->type == NET_CLIENT_TYPE_TAP);
    assert(len == sizeof(struct virtio_net_hdr_mrg_rxbuf) ||
           len == sizeof(struct virtio_net_hdr));

    tap = DO_UPCAST(TAPState, nc, nc);
    tap_fd_set_vnet_hdr_len(tap->fd, len);
    tap->host_vnet_hdr_len = len;
}
254 445d892f Michael S. Tsirkin
255 3e35ba93 Mark McLoughlin
/*
 * Record whether packets exchanged with the peer include the vnet header.
 *
 * nc must be a tap client, and the requested setting must agree with
 * whether a header length is recorded for the fd (both asserted).
 */
void tap_using_vnet_hdr(VLANClientState *nc, int using_vnet_hdr)
{
    TAPState *tap = DO_UPCAST(TAPState, nc, nc);
    int enabled = using_vnet_hdr ? 1 : 0;

    assert(nc->info->type == NET_CLIENT_TYPE_TAP);
    assert((tap->host_vnet_hdr_len != 0) == enabled);

    tap->using_vnet_hdr = enabled;
}
266 5281d757 Mark McLoughlin
267 3e35ba93 Mark McLoughlin
/*
 * Forward the offload settings to tap_fd_set_offload() for this client's
 * fd.  Does nothing when the fd is negative (tap_cleanup() sets it to -1).
 */
void tap_set_offload(VLANClientState *nc, int csum, int tso4,
                     int tso6, int ecn, int ufo)
{
    TAPState *tap = DO_UPCAST(TAPState, nc, nc);

    if (tap->fd >= 0) {
        tap_fd_set_offload(tap->fd, csum, tso4, tso6, ecn, ufo);
    }
}
277 5281d757 Mark McLoughlin
278 3e35ba93 Mark McLoughlin
/*
 * cleanup hook: tear the tap client down.
 *
 * In order: release vhost-net state if present, purge queued packets,
 * run the down script if one was recorded, unregister the fd callbacks,
 * close the fd and mark it invalid (-1).
 */
static void tap_cleanup(VLANClientState *nc)
{
    TAPState *tap = DO_UPCAST(TAPState, nc, nc);

    if (tap->vhost_net) {
        vhost_net_cleanup(tap->vhost_net);
        tap->vhost_net = NULL;
    }

    qemu_purge_queued_packets(nc);

    if (tap->down_script[0]) {
        /* The script's exit status is not acted upon. */
        launch_script(tap->down_script, tap->down_script_arg, tap->fd);
    }

    tap_read_poll(tap, 0);
    tap_write_poll(tap, 0);

    close(tap->fd);
    tap->fd = -1;
}
297 5281d757 Mark McLoughlin
298 ceb69615 Michael S. Tsirkin
/* poll hook: switch both read and write polling on or off together. */
static void tap_poll(VLANClientState *nc, bool enable)
{
    TAPState *tap = DO_UPCAST(TAPState, nc, nc);

    tap_read_poll(tap, enable);
    tap_write_poll(tap, enable);
}
304 ceb69615 Michael S. Tsirkin
305 95d528a2 Michael S. Tsirkin
/* Return the tap file descriptor.  nc must be a tap client (asserted). */
int tap_get_fd(VLANClientState *nc)
{
    TAPState *tap;

    assert(nc->info->type == NET_CLIENT_TYPE_TAP);
    tap = DO_UPCAST(TAPState, nc, nc);

    return tap->fd;
}
311 95d528a2 Michael S. Tsirkin
312 5281d757 Mark McLoughlin
/* fd support */
313 5281d757 Mark McLoughlin
314 3e35ba93 Mark McLoughlin
static NetClientInfo net_tap_info = {
315 3e35ba93 Mark McLoughlin
    .type = NET_CLIENT_TYPE_TAP,
316 3e35ba93 Mark McLoughlin
    .size = sizeof(TAPState),
317 3e35ba93 Mark McLoughlin
    .receive = tap_receive,
318 3e35ba93 Mark McLoughlin
    .receive_raw = tap_receive_raw,
319 3e35ba93 Mark McLoughlin
    .receive_iov = tap_receive_iov,
320 ceb69615 Michael S. Tsirkin
    .poll = tap_poll,
321 3e35ba93 Mark McLoughlin
    .cleanup = tap_cleanup,
322 3e35ba93 Mark McLoughlin
};
323 3e35ba93 Mark McLoughlin
324 5281d757 Mark McLoughlin
/*
 * Create a tap net client around an already-open fd.
 *
 * vnet_hdr selects whether a vnet header of sizeof(struct virtio_net_hdr)
 * bytes is recorded for the fd.  The new client starts with the header
 * not in use, all offloads cleared, no vhost-net state, and read polling
 * enabled.  Returns the new state.
 */
static TAPState *net_tap_fd_init(VLANState *vlan,
                                 const char *model,
                                 const char *name,
                                 int fd,
                                 int vnet_hdr)
{
    VLANClientState *client;
    TAPState *tap;

    client = qemu_new_net_client(&net_tap_info, vlan, NULL, model, name);
    tap = DO_UPCAST(TAPState, nc, client);

    tap->fd = fd;
    tap->vhost_net = NULL;
    tap->using_vnet_hdr = 0;
    if (vnet_hdr) {
        tap->host_vnet_hdr_len = sizeof(struct virtio_net_hdr);
    } else {
        tap->host_vnet_hdr_len = 0;
    }
    tap->has_ufo = tap_probe_has_ufo(tap->fd);

    tap_set_offload(&tap->nc, 0, 0, 0, 0, 0);
    tap_read_poll(tap, 1);

    return tap;
}
346 5281d757 Mark McLoughlin
347 5281d757 Mark McLoughlin
static int launch_script(const char *setup_script, const char *ifname, int fd)
348 5281d757 Mark McLoughlin
{
349 5281d757 Mark McLoughlin
    sigset_t oldmask, mask;
350 5281d757 Mark McLoughlin
    int pid, status;
351 5281d757 Mark McLoughlin
    char *args[3];
352 5281d757 Mark McLoughlin
    char **parg;
353 5281d757 Mark McLoughlin
354 5281d757 Mark McLoughlin
    sigemptyset(&mask);
355 5281d757 Mark McLoughlin
    sigaddset(&mask, SIGCHLD);
356 5281d757 Mark McLoughlin
    sigprocmask(SIG_BLOCK, &mask, &oldmask);
357 5281d757 Mark McLoughlin
358 5281d757 Mark McLoughlin
    /* try to launch network script */
359 5281d757 Mark McLoughlin
    pid = fork();
360 5281d757 Mark McLoughlin
    if (pid == 0) {
361 5281d757 Mark McLoughlin
        int open_max = sysconf(_SC_OPEN_MAX), i;
362 5281d757 Mark McLoughlin
363 5281d757 Mark McLoughlin
        for (i = 0; i < open_max; i++) {
364 5281d757 Mark McLoughlin
            if (i != STDIN_FILENO &&
365 5281d757 Mark McLoughlin
                i != STDOUT_FILENO &&
366 5281d757 Mark McLoughlin
                i != STDERR_FILENO &&
367 5281d757 Mark McLoughlin
                i != fd) {
368 5281d757 Mark McLoughlin
                close(i);
369 5281d757 Mark McLoughlin
            }
370 5281d757 Mark McLoughlin
        }
371 5281d757 Mark McLoughlin
        parg = args;
372 5281d757 Mark McLoughlin
        *parg++ = (char *)setup_script;
373 5281d757 Mark McLoughlin
        *parg++ = (char *)ifname;
374 9678d950 Blue Swirl
        *parg = NULL;
375 5281d757 Mark McLoughlin
        execv(setup_script, args);
376 5281d757 Mark McLoughlin
        _exit(1);
377 5281d757 Mark McLoughlin
    } else if (pid > 0) {
378 5281d757 Mark McLoughlin
        while (waitpid(pid, &status, 0) != pid) {
379 5281d757 Mark McLoughlin
            /* loop */
380 5281d757 Mark McLoughlin
        }
381 5281d757 Mark McLoughlin
        sigprocmask(SIG_SETMASK, &oldmask, NULL);
382 5281d757 Mark McLoughlin
383 5281d757 Mark McLoughlin
        if (WIFEXITED(status) && WEXITSTATUS(status) == 0) {
384 5281d757 Mark McLoughlin
            return 0;
385 5281d757 Mark McLoughlin
        }
386 5281d757 Mark McLoughlin
    }
387 5281d757 Mark McLoughlin
    fprintf(stderr, "%s: could not launch network script\n", setup_script);
388 5281d757 Mark McLoughlin
    return -1;
389 5281d757 Mark McLoughlin
}
390 5281d757 Mark McLoughlin
391 5281d757 Mark McLoughlin
/*
 * Open a tap device according to opts and run its setup script.
 *
 * Options read: "ifname" (requested interface name, may be absent),
 * "vnet_hdr" (defaults to on; treated as required only when given
 * explicitly) and "script" (skipped when absent, empty or "no").
 * On success the interface name filled in by tap_open() is stored back
 * into opts as "ifname".
 *
 * *vnet_hdr is set from the "vnet_hdr" option and is also passed to
 * tap_open() by pointer.
 *
 * Returns the open fd, or -1 if the device could not be opened or the
 * setup script failed (the fd is closed in the latter case).
 */
static int net_tap_init(QemuOpts *opts, int *vnet_hdr)
{
    char ifname[128] = {0,};
    const char *requested_ifname = qemu_opt_get(opts, "ifname");
    const char *setup_script;
    int vnet_hdr_required = 0;
    int fd;

    if (requested_ifname) {
        pstrcpy(ifname, sizeof(ifname), requested_ifname);
    }

    *vnet_hdr = qemu_opt_get_bool(opts, "vnet_hdr", 1);
    if (qemu_opt_get(opts, "vnet_hdr")) {
        vnet_hdr_required = *vnet_hdr;
    }

    TFR(fd = tap_open(ifname, sizeof(ifname), vnet_hdr, vnet_hdr_required));
    if (fd < 0) {
        return -1;
    }

    setup_script = qemu_opt_get(opts, "script");
    if (setup_script &&
        setup_script[0] != '\0' &&
        strcmp(setup_script, "no") != 0) {
        if (launch_script(setup_script, ifname, fd)) {
            close(fd);
            return -1;
        }
    }

    qemu_opt_set(opts, "ifname", ifname);

    return fd;
}
426 5281d757 Mark McLoughlin
427 5281d757 Mark McLoughlin
/*
 * Create a tap network client from command-line/monitor options.
 *
 * Two modes are supported:
 *  - "fd=": use an already-open descriptor.  "ifname", "script",
 *    "downscript" and "vnet_hdr" are rejected in this mode.  The
 *    descriptor is switched to non-blocking mode while keeping its other
 *    file status flags.
 *  - otherwise: open a tap device via net_tap_init(), filling in default
 *    values for "script" and "downscript" when they were not given.
 *
 * After the client is created the send buffer is configured, the
 * info string (and, unless it is "no", the down script) is recorded, and
 * vhost-net is initialised when requested through "vhost", "vhostfd" or
 * "vhostforce".
 *
 * Returns 0 on success, -1 on error.
 */
int net_init_tap(QemuOpts *opts, Monitor *mon, const char *name, VLANState *vlan)
{
    TAPState *s;
    int fd, vnet_hdr = 0;

    if (qemu_opt_get(opts, "fd")) {
        int flags;

        if (qemu_opt_get(opts, "ifname") ||
            qemu_opt_get(opts, "script") ||
            qemu_opt_get(opts, "downscript") ||
            qemu_opt_get(opts, "vnet_hdr")) {
            error_report("ifname=, script=, downscript= and vnet_hdr= is invalid with fd=");
            return -1;
        }

        fd = net_handle_fd_param(mon, qemu_opt_get(opts, "fd"));
        if (fd == -1) {
            return -1;
        }

        /*
         * F_SETFL replaces the whole set of file status flags, so add
         * O_NONBLOCK to the current flags instead of overwriting them.
         * If the flags cannot be read, fall back to setting O_NONBLOCK
         * alone.
         */
        flags = fcntl(fd, F_GETFL);
        if (flags == -1) {
            flags = 0;
        }
        fcntl(fd, F_SETFL, flags | O_NONBLOCK);

        vnet_hdr = tap_probe_vnet_hdr(fd);
    } else {
        if (!qemu_opt_get(opts, "script")) {
            qemu_opt_set(opts, "script", DEFAULT_NETWORK_SCRIPT);
        }

        if (!qemu_opt_get(opts, "downscript")) {
            qemu_opt_set(opts, "downscript", DEFAULT_NETWORK_DOWN_SCRIPT);
        }

        fd = net_tap_init(opts, &vnet_hdr);
        if (fd == -1) {
            return -1;
        }
    }

    s = net_tap_fd_init(vlan, "tap", name, fd, vnet_hdr);
    if (!s) {
        close(fd);
        return -1;
    }

    /*
     * NOTE(review): from here on, the error returns leave the client
     * created above (and its fd) in place -- confirm whether the caller
     * tears it down.
     */
    if (tap_set_sndbuf(s->fd, opts) < 0) {
        return -1;
    }

    if (qemu_opt_get(opts, "fd")) {
        snprintf(s->nc.info_str, sizeof(s->nc.info_str), "fd=%d", fd);
    } else {
        const char *ifname, *script, *downscript;

        ifname     = qemu_opt_get(opts, "ifname");
        script     = qemu_opt_get(opts, "script");
        downscript = qemu_opt_get(opts, "downscript");

        snprintf(s->nc.info_str, sizeof(s->nc.info_str),
                 "ifname=%s,script=%s,downscript=%s",
                 ifname, script, downscript);

        /* Remember the down script so tap_cleanup() can run it. */
        if (strcmp(downscript, "no") != 0) {
            snprintf(s->down_script, sizeof(s->down_script), "%s", downscript);
            snprintf(s->down_script_arg, sizeof(s->down_script_arg), "%s", ifname);
        }
    }

    /* vhost defaults to on when "vhostfd" is given or "vhostforce" is set. */
    if (qemu_opt_get_bool(opts, "vhost", !!qemu_opt_get(opts, "vhostfd") ||
                          qemu_opt_get_bool(opts, "vhostforce", false))) {
        int vhostfd, r;
        bool force = qemu_opt_get_bool(opts, "vhostforce", false);
        if (qemu_opt_get(opts, "vhostfd")) {
            r = net_handle_fd_param(mon, qemu_opt_get(opts, "vhostfd"));
            if (r == -1) {
                return -1;
            }
            vhostfd = r;
        } else {
            vhostfd = -1;
        }
        s->vhost_net = vhost_net_init(&s->nc, vhostfd, force);
        if (!s->vhost_net) {
            error_report("vhost-net requested but could not be initialized");
            return -1;
        }
    } else if (qemu_opt_get(opts, "vhostfd")) {
        error_report("vhostfd= is not valid without vhost");
        return -1;
    }

    return 0;
}
518 b202554c Michael S. Tsirkin
519 b202554c Michael S. Tsirkin
/*
 * Return the vhost-net state attached to this tap client, or NULL when
 * there is none.  nc must be a tap client (asserted).
 */
VHostNetState *tap_get_vhost_net(VLANClientState *nc)
{
    TAPState *tap;

    assert(nc->info->type == NET_CLIENT_TYPE_TAP);
    tap = DO_UPCAST(TAPState, nc, nc);

    return tap->vhost_net;
}