netmap_virt.h (341477) | netmap_virt.h (342033) |
---|---|
1/* 2 * Copyright (C) 2013-2016 Luigi Rizzo 3 * Copyright (C) 2013-2016 Giuseppe Lettieri | 1/* 2 * Copyright (C) 2013-2016 Luigi Rizzo 3 * Copyright (C) 2013-2016 Giuseppe Lettieri |
4 * Copyright (C) 2013-2016 Vincenzo Maffione | 4 * Copyright (C) 2013-2018 Vincenzo Maffione |
5 * Copyright (C) 2015 Stefano Garzarella 6 * All rights reserved. 7 * 8 * Redistribution and use in source and binary forms, with or without 9 * modification, are permitted provided that the following conditions 10 * are met: 11 * 1. Redistributions of source code must retain the above copyright 12 * notice, this list of conditions and the following disclaimer. --- 8 unchanged lines hidden (view full) --- 21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27 * SUCH DAMAGE. 28 * | 5 * Copyright (C) 2015 Stefano Garzarella 6 * All rights reserved. 7 * 8 * Redistribution and use in source and binary forms, with or without 9 * modification, are permitted provided that the following conditions 10 * are met: 11 * 1. Redistributions of source code must retain the above copyright 12 * notice, this list of conditions and the following disclaimer. --- 8 unchanged lines hidden (view full) --- 21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27 * SUCH DAMAGE. 28 * |
29 * $FreeBSD: stable/11/sys/net/netmap_virt.h 341477 2018-12-04 17:40:56Z vmaffione $ | 29 * $FreeBSD: stable/11/sys/net/netmap_virt.h 342033 2018-12-13 10:13:29Z vmaffione $ |
30 */ 31 32#ifndef NETMAP_VIRT_H 33#define NETMAP_VIRT_H 34 35/* | 30 */ 31 32#ifndef NETMAP_VIRT_H 33#define NETMAP_VIRT_H 34 35/* |
36 * ptnetmap_memdev: device used to expose memory into the guest VM | 36 * Register offsets and other macros for the ptnetmap paravirtual devices: 37 * ptnetmap-memdev: device used to expose memory into the guest 38 * ptnet: paravirtualized NIC exposing a netmap port in the guest |
37 * 38 * These macros are used in the hypervisor frontend (QEMU, bhyve) and in the 39 * guest device driver. 40 */ 41 | 39 * 40 * These macros are used in the hypervisor frontend (QEMU, bhyve) and in the 41 * guest device driver. 42 */ 43 |
42/* PCI identifiers and PCI BARs for the ptnetmap memdev 43 * and ptnetmap network interface. */ | 44/* PCI identifiers and PCI BARs for ptnetmap-memdev and ptnet. */ |
44#define PTNETMAP_MEMDEV_NAME "ptnetmap-memdev" 45#define PTNETMAP_PCI_VENDOR_ID 0x1b36 /* QEMU virtual devices */ 46#define PTNETMAP_PCI_DEVICE_ID 0x000c /* memory device */ 47#define PTNETMAP_PCI_NETIF_ID 0x000d /* ptnet network interface */ 48#define PTNETMAP_IO_PCI_BAR 0 49#define PTNETMAP_MEM_PCI_BAR 1 50#define PTNETMAP_MSIX_PCI_BAR 2 51 | 45#define PTNETMAP_MEMDEV_NAME "ptnetmap-memdev" 46#define PTNETMAP_PCI_VENDOR_ID 0x1b36 /* QEMU virtual devices */ 47#define PTNETMAP_PCI_DEVICE_ID 0x000c /* memory device */ 48#define PTNETMAP_PCI_NETIF_ID 0x000d /* ptnet network interface */ 49#define PTNETMAP_IO_PCI_BAR 0 50#define PTNETMAP_MEM_PCI_BAR 1 51#define PTNETMAP_MSIX_PCI_BAR 2 52 |
52/* Registers for the ptnetmap memdev */ | 53/* Device registers for ptnetmap-memdev */ |
53#define PTNET_MDEV_IO_MEMSIZE_LO 0 /* netmap memory size (low) */ 54#define PTNET_MDEV_IO_MEMSIZE_HI 4 /* netmap_memory_size (high) */ 55#define PTNET_MDEV_IO_MEMID 8 /* memory allocator ID in the host */ 56#define PTNET_MDEV_IO_IF_POOL_OFS 64 57#define PTNET_MDEV_IO_IF_POOL_OBJNUM 68 58#define PTNET_MDEV_IO_IF_POOL_OBJSZ 72 59#define PTNET_MDEV_IO_RING_POOL_OFS 76 60#define PTNET_MDEV_IO_RING_POOL_OBJNUM 80 61#define PTNET_MDEV_IO_RING_POOL_OBJSZ 84 62#define PTNET_MDEV_IO_BUF_POOL_OFS 88 63#define PTNET_MDEV_IO_BUF_POOL_OBJNUM 92 64#define PTNET_MDEV_IO_BUF_POOL_OBJSZ 96 65#define PTNET_MDEV_IO_END 100 66 | 54#define PTNET_MDEV_IO_MEMSIZE_LO 0 /* netmap memory size (low) */ 55#define PTNET_MDEV_IO_MEMSIZE_HI 4 /* netmap_memory_size (high) */ 56#define PTNET_MDEV_IO_MEMID 8 /* memory allocator ID in the host */ 57#define PTNET_MDEV_IO_IF_POOL_OFS 64 58#define PTNET_MDEV_IO_IF_POOL_OBJNUM 68 59#define PTNET_MDEV_IO_IF_POOL_OBJSZ 72 60#define PTNET_MDEV_IO_RING_POOL_OFS 76 61#define PTNET_MDEV_IO_RING_POOL_OBJNUM 80 62#define PTNET_MDEV_IO_RING_POOL_OBJSZ 84 63#define PTNET_MDEV_IO_BUF_POOL_OFS 88 64#define PTNET_MDEV_IO_BUF_POOL_OBJNUM 92 65#define PTNET_MDEV_IO_BUF_POOL_OBJSZ 96 66#define PTNET_MDEV_IO_END 100 67 |
67/* 68 * ptnetmap configuration 69 * 70 * The ptnet kthreads (running in host kernel-space) need to be configured 71 * in order to know how to intercept guest kicks (I/O register writes) and 72 * how to inject MSI-X interrupts to the guest. The configuration may vary 73 * depending on the hypervisor. Currently, we support QEMU/KVM on Linux and 74 * and bhyve on FreeBSD. 75 * The configuration is passed by the hypervisor to the host netmap module 76 * by means of an ioctl() with nr_cmd=NETMAP_PT_HOST_CREATE, and it is 77 * specified by the ptnetmap_cfg struct. This struct contains an header 78 * with general informations and an array of entries whose size depends 79 * on the hypervisor. The NETMAP_PT_HOST_CREATE command is issued every 80 * time the kthreads are started. 81 */ 82struct ptnetmap_cfg { 83#define PTNETMAP_CFGTYPE_QEMU 0x1 84#define PTNETMAP_CFGTYPE_BHYVE 0x2 85 uint16_t cfgtype; /* how to interpret the cfg entries */ 86 uint16_t entry_size; /* size of a config entry */ 87 uint32_t num_rings; /* number of config entries */ 88 void *csb_gh; /* CSB for guest --> host communication */ 89 void *csb_hg; /* CSB for host --> guest communication */ 90 /* Configuration entries are allocated right after the struct. */ 91}; 92 93/* Configuration of a ptnetmap ring for QEMU. */ 94struct ptnetmap_cfgentry_qemu { 95 uint32_t ioeventfd; /* to intercept guest register access */ 96 uint32_t irqfd; /* to inject guest interrupts */ 97}; 98 99/* Configuration of a ptnetmap ring for bhyve. */ 100struct ptnetmap_cfgentry_bhyve { 101 uint64_t wchan; /* tsleep() parameter, to wake up kthread */ 102 uint32_t ioctl_fd; /* ioctl fd */ 103 /* ioctl parameters to send irq */ 104 uint32_t ioctl_cmd; 105 /* vmm.ko MSIX parameters for IOCTL */ 106 struct { 107 uint64_t msg_data; 108 uint64_t addr; 109 } ioctl_data; 110}; 111 112/* 113 * Pass a pointer to a userspace buffer to be passed to kernelspace for write 114 * or read. Used by NETMAP_PT_HOST_CREATE. 115 * XXX deprecated 116 */ 117static inline void 118nmreq_pointer_put(struct nmreq *nmr, void *userptr) 119{ 120 uintptr_t *pp = (uintptr_t *)&nmr->nr_arg1; 121 *pp = (uintptr_t)userptr; 122} 123 124static inline void * 125nmreq_pointer_get(const struct nmreq *nmr) 126{ 127 const uintptr_t *pp = (const uintptr_t *)&nmr->nr_arg1; 128 return (void *)*pp; 129} 130 | |
131/* ptnetmap features */ 132#define PTNETMAP_F_VNET_HDR 1 133 | 68/* ptnetmap features */ 69#define PTNETMAP_F_VNET_HDR 1 70 |
134/* I/O registers for the ptnet device. */ | 71/* Device registers for the ptnet network device. */ |
135#define PTNET_IO_PTFEAT 0 136#define PTNET_IO_PTCTL 4 137#define PTNET_IO_MAC_LO 8 138#define PTNET_IO_MAC_HI 12 139#define PTNET_IO_CSBBAH 16 /* deprecated */ 140#define PTNET_IO_CSBBAL 20 /* deprecated */ 141#define PTNET_IO_NIFP_OFS 24 142#define PTNET_IO_NUM_TX_RINGS 28 --- 5 unchanged lines hidden (view full) --- 148#define PTNET_IO_CSB_GH_BAH 52 149#define PTNET_IO_CSB_GH_BAL 56 150#define PTNET_IO_CSB_HG_BAH 60 151#define PTNET_IO_CSB_HG_BAL 64 152#define PTNET_IO_END 68 153#define PTNET_IO_KICK_BASE 128 154#define PTNET_IO_MASK 0xff 155 | 72#define PTNET_IO_PTFEAT 0 73#define PTNET_IO_PTCTL 4 74#define PTNET_IO_MAC_LO 8 75#define PTNET_IO_MAC_HI 12 76#define PTNET_IO_CSBBAH 16 /* deprecated */ 77#define PTNET_IO_CSBBAL 20 /* deprecated */ 78#define PTNET_IO_NIFP_OFS 24 79#define PTNET_IO_NUM_TX_RINGS 28 --- 5 unchanged lines hidden (view full) --- 85#define PTNET_IO_CSB_GH_BAH 52 86#define PTNET_IO_CSB_GH_BAL 56 87#define PTNET_IO_CSB_HG_BAH 60 88#define PTNET_IO_CSB_HG_BAL 64 89#define PTNET_IO_END 68 90#define PTNET_IO_KICK_BASE 128 91#define PTNET_IO_MASK 0xff 92 |
156/* ptnetmap control commands (values for PTCTL register) */ | 93/* ptnet control commands (values for PTCTL register): 94 * - CREATE starts the host sync-kloop 95 * - DELETE stops the host sync-kloop 96 */ |
157#define PTNETMAP_PTCTL_CREATE 1 158#define PTNETMAP_PTCTL_DELETE 2 159 | 97#define PTNETMAP_PTCTL_CREATE 1 98#define PTNETMAP_PTCTL_DELETE 2 99 |
160/* ptnetmap synchronization variables shared between guest and host */ 161struct ptnet_csb_gh { 162 uint32_t head; /* GW+ HR+ the head of the guest netmap_ring */ 163 uint32_t cur; /* GW+ HR+ the cur of the guest netmap_ring */ 164 uint32_t guest_need_kick; /* GW+ HR+ host-->guest notification enable */ 165 uint32_t sync_flags; /* GW+ HR+ the flags of the guest [tx|rx]sync() */ 166 char pad[48]; /* pad to a 64 bytes cacheline */ 167}; 168struct ptnet_csb_hg { 169 uint32_t hwcur; /* GR+ HW+ the hwcur of the host netmap_kring */ 170 uint32_t hwtail; /* GR+ HW+ the hwtail of the host netmap_kring */ 171 uint32_t host_need_kick; /* GR+ HW+ guest-->host notification enable */ 172 char pad[4+48]; 173}; 174 175#ifdef WITH_PTNETMAP_GUEST 176 177/* ptnetmap_memdev routines used to talk with ptnetmap_memdev device driver */ 178struct ptnetmap_memdev; 179int nm_os_pt_memdev_iomap(struct ptnetmap_memdev *, vm_paddr_t *, void **, 180 uint64_t *); 181void nm_os_pt_memdev_iounmap(struct ptnetmap_memdev *); 182uint32_t nm_os_pt_memdev_ioread(struct ptnetmap_memdev *, unsigned int); 183 184/* Guest driver: Write kring pointers (cur, head) to the CSB. 185 * This routine is coupled with ptnetmap_host_read_kring_csb(). */ 186static inline void 187ptnetmap_guest_write_kring_csb(struct ptnet_csb_gh *ptr, uint32_t cur, 188 uint32_t head) 189{ 190 /* 191 * We need to write cur and head to the CSB but we cannot do it atomically. 192 * There is no way we can prevent the host from reading the updated value 193 * of one of the two and the old value of the other. However, if we make 194 * sure that the host never reads a value of head more recent than the 195 * value of cur we are safe. We can allow the host to read a value of cur 196 * more recent than the value of head, since in the netmap ring cur can be 197 * ahead of head and cur cannot wrap around head because it must be behind 198 * tail. Inverting the order of writes below could instead result into the 199 * host to think head went ahead of cur, which would cause the sync 200 * prologue to fail. 201 * 202 * The following memory barrier scheme is used to make this happen: 203 * 204 * Guest Host 205 * 206 * STORE(cur) LOAD(head) 207 * mb() <-----------> mb() 208 * STORE(head) LOAD(cur) 209 */ 210 ptr->cur = cur; 211 mb(); 212 ptr->head = head; 213} 214 215/* Guest driver: Read kring pointers (hwcur, hwtail) from the CSB. 216 * This routine is coupled with ptnetmap_host_write_kring_csb(). */ 217static inline void 218ptnetmap_guest_read_kring_csb(struct ptnet_csb_hg *pthg, struct netmap_kring *kring) 219{ 220 /* 221 * We place a memory barrier to make sure that the update of hwtail never 222 * overtakes the update of hwcur. 223 * (see explanation in ptnetmap_host_write_kring_csb). 224 */ 225 kring->nr_hwtail = pthg->hwtail; 226 mb(); 227 kring->nr_hwcur = pthg->hwcur; 228} 229 230#endif /* WITH_PTNETMAP_GUEST */ 231 232#ifdef WITH_PTNETMAP_HOST 233/* 234 * ptnetmap kernel thread routines 235 * */ 236 237/* Functions to read and write CSB fields in the host */ 238#if defined (linux) 239#define CSB_READ(csb, field, r) (get_user(r, &csb->field)) 240#define CSB_WRITE(csb, field, v) (put_user(v, &csb->field)) 241#else /* ! linux */ 242#define CSB_READ(csb, field, r) (r = fuword32(&csb->field)) 243#define CSB_WRITE(csb, field, v) (suword32(&csb->field, v)) 244#endif /* ! linux */ 245 246/* Host netmap: Write kring pointers (hwcur, hwtail) to the CSB. 247 * This routine is coupled with ptnetmap_guest_read_kring_csb(). */ 248static inline void 249ptnetmap_host_write_kring_csb(struct ptnet_csb_hg __user *ptr, uint32_t hwcur, 250 uint32_t hwtail) 251{ 252 /* 253 * The same scheme used in ptnetmap_guest_write_kring_csb() applies here. 254 * We allow the guest to read a value of hwcur more recent than the value 255 * of hwtail, since this would anyway result in a consistent view of the 256 * ring state (and hwcur can never wraparound hwtail, since hwcur must be 257 * behind head). 258 * 259 * The following memory barrier scheme is used to make this happen: 260 * 261 * Guest Host 262 * 263 * STORE(hwcur) LOAD(hwtail) 264 * mb() <-------------> mb() 265 * STORE(hwtail) LOAD(hwcur) 266 */ 267 CSB_WRITE(ptr, hwcur, hwcur); 268 mb(); 269 CSB_WRITE(ptr, hwtail, hwtail); 270} 271 272/* Host netmap: Read kring pointers (head, cur, sync_flags) from the CSB. 273 * This routine is coupled with ptnetmap_guest_write_kring_csb(). */ 274static inline void 275ptnetmap_host_read_kring_csb(struct ptnet_csb_gh __user *ptr, 276 struct netmap_ring *shadow_ring, 277 uint32_t num_slots) 278{ 279 /* 280 * We place a memory barrier to make sure that the update of head never 281 * overtakes the update of cur. 282 * (see explanation in ptnetmap_guest_write_kring_csb). 283 */ 284 CSB_READ(ptr, head, shadow_ring->head); 285 mb(); 286 CSB_READ(ptr, cur, shadow_ring->cur); 287 CSB_READ(ptr, sync_flags, shadow_ring->flags); 288} 289 290#endif /* WITH_PTNETMAP_HOST */ 291 | |
292#endif /* NETMAP_VIRT_H */ | 100#endif /* NETMAP_VIRT_H */ |