2 * Copyright (c) 2007 The DragonFly Project. All rights reserved.
4 * This code is derived from software contributed to The DragonFly Project
5 * by Sepherosa Ziehau <sepherosa@gmail.com>
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in
15 * the documentation and/or other materials provided with the
17 * 3. Neither the name of The DragonFly Project nor the names of its
18 * contributors may be used to endorse or promote products derived
19 * from this software without specific, prior written permission.
21 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
24 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
25 * COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
26 * INCIDENTAL, SPECIAL, EXEMPLARY OR CONSEQUENTIAL DAMAGES (INCLUDING,
27 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
28 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
29 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
30 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
31 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
34 * $DragonFly: src/sys/dev/virtual/net/if_vke.c,v 1.10 2008/05/27 23:44:46 dillon Exp $
37 #include <sys/param.h>
38 #include <sys/endian.h>
39 #include <sys/kernel.h>
40 #include <sys/malloc.h>
42 #include <sys/serialize.h>
43 #include <sys/socket.h>
44 #include <sys/sockio.h>
45 #include <sys/sysctl.h>
47 #include <machine/md_var.h>
49 #include <net/ethernet.h>
52 #include <net/if_arp.h>
53 #include <net/ifq_var.h>
55 #include <netinet/in_var.h>
58 #include <net/tap/if_tap.h>
/* Driver name: interface name prefix and tag used in log messages. */
65 #define VKE_DEVNAME "vke"
/*
 * Members of the per-interface softc (accessed through
 * struct vke_softc *sc in the functions below).  Other members are
 * not visible in this excerpt.
 */
/* Registration returned by kqueue_add() in the init path; NULL while stopped. */
72 struct kqueue_info *sc_kqueue;
/* Spare receive mbuf that vke_rxeof() keeps for its next read. */
75 struct mbuf *sc_rx_mbuf;
/* Sysctl context and per-interface node created in vke_attach(). */
77 struct sysctl_ctx_list sc_sysctl_ctx;
78 struct sysctl_oid *sc_sysctl_tree;
/* Copied from the vknetif_info handed to vke_attach(). */
80 int sc_tap_unit; /* unit of backend tap(4) */
81 in_addr_t sc_addr; /* address */
82 in_addr_t sc_mask; /* netmask */
/* Forward declarations of the driver's file-local routines. */
/* ifnet method hooks (installed in vke_attach()). */
85 static void vke_start(struct ifnet *);
86 static void vke_init(void *);
87 static int vke_ioctl(struct ifnet *, u_long, caddr_t, struct ucred *);
/* Attach, event handling, stop/receive helpers and address setup. */
89 static int vke_attach(const struct vknetif_info *, int);
90 static void vke_intr(void *, struct intrframe *);
91 static int vke_stop(struct vke_softc *);
92 static void vke_rxeof(struct vke_softc *);
93 static int vke_init_addr(struct ifnet *, in_addr_t, in_addr_t);
/*
 * Boot-time hook: walks NetifInfo[0..NetifNum) and calls vke_attach()
 * for each entry.  The argument is unused.  Registered through the
 * SYSINIT() below.
 */
96 vke_sysinit(void *arg __unused)
/* The number of configured netifs must not exceed VKNETIF_MAX. */
100 KASSERT(NetifNum <= VKNETIF_MAX, ("too many netifs: %d\n", NetifNum));
103 for (i = 0; i < NetifNum; ++i) {
/*
 * A return of 0 is tested for here; what is done on that result is not
 * visible in this excerpt (presumably `unit` is advanced -- confirm).
 */
104 if (vke_attach(&NetifInfo[i], unit) == 0)
/* Run vke_sysinit() at SI_SUB_DRIVERS, SI_ORDER_MIDDLE with a NULL argument. */
108 SYSINIT(vke, SI_SUB_DRIVERS, SI_ORDER_MIDDLE, vke_sysinit, NULL);
/*
 * NOTE(review): the function header is not visible in this excerpt;
 * this is presumably the body of vke_init(void *xsc), the if_init
 * hook.  It registers the event handler for the backend descriptor,
 * marks the interface running and installs any pre-configured address.
 */
113 struct vke_softc *sc = xsc;
114 struct ifnet *ifp = &sc->arpcom.ac_if;
/* The caller must hold the interface serializer. */
116 ASSERT_SERIALIZED(ifp->if_serializer);
/*
 * Register vke_intr() for events on sc_fd.  No registration may already
 * exist, and the new registration must succeed.
 */
120 KKASSERT(sc->sc_kqueue == NULL);
121 sc->sc_kqueue = kqueue_add(sc->sc_fd, vke_intr, sc);
122 KKASSERT(sc->sc_kqueue != NULL);
/* Mark the interface running and clear the output-active flag. */
124 ifp->if_flags |= IFF_RUNNING;
125 ifp->if_flags &= ~IFF_OACTIVE;
/*
 * A non-zero sc_addr means an address was pre-configured; it is handed
 * to vke_init_addr() below.  The statements that load addr/mask are not
 * visible in this excerpt.
 */
127 if (sc->sc_addr != 0) {
128 in_addr_t addr, mask;
134 * Make sure vkernel assigned
135 * address will not be added
141 vke_init_addr(ifp, addr, mask);
/*
 * if_start hook: drains the interface send queue, copying each packet
 * into the flat buffer sc_txbuf and write()ing it to the backend
 * descriptor sc_fd.
 */
148 vke_start(struct ifnet *ifp)
150 struct vke_softc *sc = ifp->if_softc;
/* The caller must hold the interface serializer. */
153 ASSERT_SERIALIZED(ifp->if_serializer);
/*
 * True unless IFF_RUNNING is set and IFF_OACTIVE is clear; the action
 * taken is not visible here (presumably an early return -- confirm).
 */
155 if ((ifp->if_flags & (IFF_RUNNING | IFF_OACTIVE)) != IFF_RUNNING)
158 while ((m = ifq_dequeue(&ifp->if_snd, NULL)) != NULL) {
160 * Copy the data into a single mbuf and write it out
/*
 * Only packets of at most MCLBYTES (the size allocated for sc_txbuf in
 * vke_attach()) are copied and written.  What happens to larger packets
 * and on write() failure is not visible in this excerpt.
 */
163 if (m->m_pkthdr.len <= MCLBYTES) {
164 m_copydata(m, 0, m->m_pkthdr.len, sc->sc_txbuf);
166 if (write(sc->sc_fd, sc->sc_txbuf, m->m_pkthdr.len) < 0)
/*
 * if_ioctl hook.  Most case labels of the command switch are not
 * visible in this excerpt; the comments below describe only what the
 * visible lines do.
 */
178 vke_ioctl(struct ifnet *ifp, u_long cmd, caddr_t data, struct ucred *cr)
180 struct vke_softc *sc = ifp->if_softc;
/* The caller must hold the interface serializer. */
183 ASSERT_SERIALIZED(ifp->if_serializer);
/*
 * Compare IFF_UP with IFF_RUNNING: up-but-not-running and
 * down-but-running are the two states acted on (presumably by calling
 * vke_init() and vke_stop() respectively -- the calls are not visible).
 */
187 if (ifp->if_flags & IFF_UP) {
188 if ((ifp->if_flags & IFF_RUNNING) == 0)
191 if (ifp->if_flags & IFF_RUNNING)
/*
 * Status query: append a line naming the backend tap unit to the text
 * already in ifs->ascii, provided the existing text leaves room.
 */
200 case SIOCGIFSTATUS: {
201 struct ifstat *ifs = (struct ifstat *)data;
204 len = strlen(ifs->ascii);
205 if (len < sizeof(ifs->ascii)) {
206 ksnprintf(ifs->ascii + len, sizeof(ifs->ascii) - len,
207 "\tBacked by tap%d\n", sc->sc_tap_unit);
/* Here data is interpreted as a struct ifaddr; only AF_INET is special-cased. */
212 if (((struct ifaddr *)data)->ifa_addr->sa_family == AF_INET) {
214 * If we are explicitly requested to change address,
215 * we should invalidate address/netmask passed in
216 * from vkernel command line.
/* Hand the request to the generic Ethernet ioctl handler. */
223 error = ether_ioctl(ifp, cmd, data);
/*
 * Stop the interface: clear the running/output-active flags, drop the
 * event registration on the backend descriptor and release the spare
 * receive mbuf.  The return value is not visible in this excerpt.
 */
230 vke_stop(struct vke_softc *sc)
232 struct ifnet *ifp = &sc->arpcom.ac_if;
/* The caller must hold the interface serializer. */
234 ASSERT_SERIALIZED(ifp->if_serializer);
236 ifp->if_flags &= ~(IFF_RUNNING | IFF_OACTIVE);
/*
 * Remove the registration made with kqueue_add() and reset the pointer
 * to NULL, which the init path asserts before registering again.  Any
 * guard around this call is not visible here.
 */
238 kqueue_del(sc->sc_kqueue);
239 sc->sc_kqueue = NULL;
/* Free the mbuf that vke_rxeof() kept for its next read, if any. */
242 if (sc->sc_rx_mbuf != NULL) {
243 m_freem(sc->sc_rx_mbuf);
244 sc->sc_rx_mbuf = NULL;
/*
 * Event callback registered with kqueue_add() for the backend
 * descriptor.  xsc is the softc; the interrupt frame is unused.
 */
250 vke_intr(void *xsc, struct intrframe *frame __unused)
252 struct vke_softc *sc = xsc;
253 struct ifnet *ifp = &sc->arpcom.ac_if;
/* Take the interface serializers for the duration of the handler. */
255 ifnet_serialize_all(ifp);
/*
 * Test for a non-running interface; the action taken and the work done
 * when running are not visible here (presumably the former skips to the
 * deserialize and the latter calls vke_rxeof() -- confirm).
 */
257 if ((ifp->if_flags & IFF_RUNNING) == 0)
265 ifnet_deserialize_all(ifp);
/*
 * Receive path: read() packets from the backend descriptor into an mbuf
 * cluster and pass them to ifp->if_input().  The loop and branch
 * structure is only partly visible in this excerpt.
 */
269 vke_rxeof(struct vke_softc *sc)
271 struct ifnet *ifp = &sc->arpcom.ac_if;
/* The caller must hold the interface serializer. */
274 ASSERT_SERIALIZED(ifp->if_serializer);
/*
 * Reuse the spare mbuf kept from an earlier call if there is one;
 * otherwise try a non-blocking allocation of a packet-header mbuf with
 * a cluster.
 */
282 if ((m = sc->sc_rx_mbuf) == NULL)
283 m = m_getcl(MB_DONTWAIT, MT_DATA, M_PKTHDR);
285 sc->sc_rx_mbuf = NULL;
288 * Drain the interface whether we get an mbuf or not or
289 * we might stop receiving interrupts.
/*
 * Two read() forms: into the mbuf's data area, or into sc_txbuf used as
 * a scratch buffer.  Per the comment above, the second form presumably
 * serves the no-mbuf case and its data is discarded -- confirm.
 */
292 n = read(sc->sc_fd, mtod(m, void *), MCLBYTES);
294 n = read(sc->sc_fd, sc->sc_txbuf, MCLBYTES);
297 sc->sc_rx_mbuf = m; /* We can use it next time */
/* Fill in the packet header (n bytes received on ifp) and hand the mbuf up. */
302 m->m_pkthdr.rcvif = ifp;
303 m->m_pkthdr.len = m->m_len = n;
304 ifp->if_input(ifp, m);
/*
 * Create and attach one vke interface for the backend described by
 * info.  `unit` is used in diagnostic messages.  The return statements
 * are not visible in this excerpt; vke_sysinit() tests the result
 * against 0.
 */
312 vke_attach(const struct vknetif_info *info, int unit)
314 struct vke_softc *sc;
316 struct tapinfo tapinfo;
317 uint8_t enaddr[ETHER_ADDR_LEN];
/* The backend descriptor must already be valid. */
320 KKASSERT(info->tap_fd >= 0);
324 * This is only a TAP device if tap_unit is non-zero. If
325 * connecting to a virtual socket we generate a unique MAC.
/*
 * NOTE(review): the comment above says "non-zero", but the test below is
 * tap_unit >= 0, so unit 0 also takes the tap path -- confirm wording.
 */
327 if (info->tap_unit >= 0) {
/* Tap path: query the backend for its link parameters and MAC address. */
328 if (ioctl(fd, TAPGIFINFO, &tapinfo) < 0) {
329 kprintf(VKE_DEVNAME "%d: ioctl(TAPGIFINFO) "
330 "failed: %s\n", unit, strerror(errno));
334 if (ioctl(fd, SIOCGIFADDR, enaddr) < 0) {
335 kprintf(VKE_DEVNAME "%d: ioctl(SIOCGIFADDR) "
336 "failed: %s\n", unit, strerror(errno));
/*
 * MAC generation (presumably the non-tap branch; the branch structure is
 * not visible here).  read() fills enaddr[2..5] from /dev/urandom, then
 * enaddr[4] and enaddr[5] are overwritten with the pid, so only
 * enaddr[2..3] stay random.
 * NOTE(review): this declares a new `fd`, distinct from the one used for
 * the ioctls above; the read() result is not checked on the visible
 * line; enaddr[0..1] are not set by any visible line -- confirm.
 */
340 int fd = open("/dev/urandom", O_RDONLY);
342 read(fd, enaddr + 2, 4);
345 enaddr[4] = (int)getpid() >> 8;
346 enaddr[5] = (int)getpid() & 255;
/* Allocate the zeroed softc and a MCLBYTES transmit buffer (both M_WAITOK). */
351 sc = kmalloc(sizeof(*sc), M_DEVBUF, M_WAITOK | M_ZERO);
353 sc->sc_txbuf = kmalloc(MCLBYTES, M_DEVBUF, M_WAITOK);
/* Record the backend unit and the pre-configured address/netmask. */
356 sc->sc_tap_unit = info->tap_unit;
357 sc->sc_addr = info->netif_addr;
358 sc->sc_mask = info->netif_mask;
360 ifp = &sc->arpcom.ac_if;
361 if_initname(ifp, VKE_DEVNAME, sc->sc_unit);
/*
 * Create a sysctl node named after the interface under the static _hw
 * children, and export the backend tap unit beneath it as a read-only
 * integer.
 */
363 /* NB: after if_initname() */
364 sysctl_ctx_init(&sc->sc_sysctl_ctx);
365 sc->sc_sysctl_tree = SYSCTL_ADD_NODE(&sc->sc_sysctl_ctx,
366 SYSCTL_STATIC_CHILDREN(_hw),
367 OID_AUTO, ifp->if_xname,
/*
 * Failure to create the node is only logged.  How the SYSCTL_ADD_INT
 * below relates to this test (presumably the else branch) is not
 * visible in this excerpt.
 */
369 if (sc->sc_sysctl_tree == NULL) {
370 kprintf(VKE_DEVNAME "%d: can't add sysctl node\n", unit);
372 SYSCTL_ADD_INT(&sc->sc_sysctl_ctx,
373 SYSCTL_CHILDREN(sc->sc_sysctl_tree),
374 OID_AUTO, "tap_unit",
375 CTLFLAG_RD, &sc->sc_tap_unit, 0,
376 "Backend tap(4) unit");
/*
 * Install the ifnet method hooks, link parameters, flags and send queue
 * limits.
 * NOTE(review): tapinfo is filled only by the TAPGIFINFO ioctl inside
 * the tap_unit >= 0 test above; if the other path reaches this point,
 * mtu and baudrate are read from an uninitialized stack object --
 * confirm against the full function.
 */
380 ifp->if_ioctl = vke_ioctl;
381 ifp->if_start = vke_start;
382 ifp->if_init = vke_init;
383 ifp->if_mtu = tapinfo.mtu;
384 ifp->if_baudrate = tapinfo.baudrate;
385 ifp->if_flags = IFF_BROADCAST | IFF_SIMPLEX | IFF_MULTICAST;
386 ifq_set_maxlen(&ifp->if_snd, IFQ_MAXLEN);
387 ifq_set_ready(&ifp->if_snd);
/* Attach as an Ethernet interface using the MAC address in enaddr. */
391 ether_ifattach(ifp, enaddr, NULL);
/* With bootverbose set, report a pre-configured address (converted with ntohl() for display). */
393 if (bootverbose && sc->sc_addr != 0) {
394 if_printf(ifp, "pre-configured "
395 "address 0x%08x, netmask 0x%08x\n",
396 ntohl(sc->sc_addr), ntohl(sc->sc_mask));
/*
 * Add the given IPv4 address and netmask to ifp by issuing SIOCAIFADDR
 * through in_control().  addr and mask are stored into s_addr unchanged
 * and run through ntohl() for printing, so they are presumably in
 * network byte order.  The return statement is not visible in this
 * excerpt.
 */
403 vke_init_addr(struct ifnet *ifp, in_addr_t addr, in_addr_t mask)
405 struct ifaliasreq ifra;
406 struct sockaddr_in *sin;
/* Entered with the interface serializer held. */
409 ASSERT_SERIALIZED(ifp->if_serializer);
/* Log the address being added; any condition guarding this print is not visible here. */
412 if_printf(ifp, "add pre-configured "
413 "address 0x%08x, netmask 0x%08x\n",
414 ntohl(addr), ntohl(mask));
/* Build the alias request from a zeroed structure. */
417 bzero(&ifra, sizeof(ifra));
419 /* NB: no need to set ifaliasreq.ifra_name */
/* Address part of the request. */
421 sin = (struct sockaddr_in *)&ifra.ifra_addr;
422 sin->sin_family = AF_INET;
423 sin->sin_len = sizeof(*sin);
424 sin->sin_addr.s_addr = addr;
/*
 * Netmask part of the request; only the length and address are set on
 * the visible lines.  Any condition guarding this part is not visible.
 */
427 sin = (struct sockaddr_in *)&ifra.ifra_mask;
428 sin->sin_len = sizeof(*sin);
429 sin->sin_addr.s_addr = mask;
433 * Temporarily release serializer, in_control() will hold
434 * it again before calling ifnet.if_ioctl().
/* Drop the serializer around in_control() and retake it afterwards. */
436 ifnet_deserialize_all(ifp);
437 ret = in_control(NULL, SIOCAIFADDR, (caddr_t)&ifra, ifp, NULL);
438 ifnet_serialize_all(ifp);