| .. | .. |
|---|
| 1 | +// SPDX-License-Identifier: GPL-2.0-only |
|---|
| 1 | 2 | /**************************************************************************** |
|---|
| 2 | 3 | * Driver for Solarflare network controllers and boards |
|---|
| 3 | 4 | * Copyright 2005-2006 Fen Systems Ltd. |
|---|
| 4 | 5 | * Copyright 2005-2013 Solarflare Communications Inc. |
|---|
| 5 | | - * |
|---|
| 6 | | - * This program is free software; you can redistribute it and/or modify it |
|---|
| 7 | | - * under the terms of the GNU General Public License version 2 as published |
|---|
| 8 | | - * by the Free Software Foundation, incorporated herein by reference. |
|---|
| 9 | 6 | */ |
|---|
| 10 | 7 | |
|---|
| 11 | 8 | #include <linux/socket.h> |
|---|
| .. | .. |
|---|
| 20 | 17 | #include <linux/iommu.h> |
|---|
| 21 | 18 | #include <net/ip.h> |
|---|
| 22 | 19 | #include <net/checksum.h> |
|---|
| 20 | +#include <net/xdp.h> |
|---|
| 21 | +#include <linux/bpf_trace.h> |
|---|
| 23 | 22 | #include "net_driver.h" |
|---|
| 24 | 23 | #include "efx.h" |
|---|
| 24 | +#include "rx_common.h" |
|---|
| 25 | 25 | #include "filter.h" |
|---|
| 26 | 26 | #include "nic.h" |
|---|
| 27 | 27 | #include "selftest.h" |
|---|
| .. | .. |
|---|
| 30 | 30 | /* Preferred number of descriptors to fill at once */ |
|---|
| 31 | 31 | #define EFX_RX_PREFERRED_BATCH 8U |
|---|
| 32 | 32 | |
|---|
| 33 | | -/* Number of RX buffers to recycle pages for. When creating the RX page recycle |
|---|
| 34 | | - * ring, this number is divided by the number of buffers per page to calculate |
|---|
| 35 | | - * the number of pages to store in the RX page recycle ring. |
|---|
| 36 | | - */ |
|---|
| 37 | | -#define EFX_RECYCLE_RING_SIZE_IOMMU 4096 |
|---|
| 38 | | -#define EFX_RECYCLE_RING_SIZE_NOIOMMU (2 * EFX_RX_PREFERRED_BATCH) |
|---|
| 33 | +/* Maximum rx prefix used by any architecture. */ |
|---|
| 34 | +#define EFX_MAX_RX_PREFIX_SIZE 16 |
|---|
| 39 | 35 | |
|---|
| 40 | 36 | /* Size of buffer allocated for skb header area. */ |
|---|
| 41 | 37 | #define EFX_SKB_HEADERS 128u |
|---|
| 42 | 38 | |
|---|
| 43 | | -/* This is the percentage fill level below which new RX descriptors |
|---|
| 44 | | - * will be added to the RX descriptor ring. |
|---|
| 45 | | - */ |
|---|
| 46 | | -static unsigned int rx_refill_threshold; |
|---|
| 47 | | - |
|---|
| 48 | 39 | /* Each packet can consume up to ceil(max_frame_len / buffer_size) buffers */ |
|---|
| 49 | 40 | #define EFX_RX_MAX_FRAGS DIV_ROUND_UP(EFX_MAX_FRAME_LEN(EFX_MAX_MTU), \ |
|---|
| 50 | 41 | EFX_RX_USR_BUF_SIZE) |
|---|
| 51 | | - |
|---|
| 52 | | -/* |
|---|
| 53 | | - * RX maximum head room required. |
|---|
| 54 | | - * |
|---|
| 55 | | - * This must be at least 1 to prevent overflow, plus one packet-worth |
|---|
| 56 | | - * to allow pipelined receives. |
|---|
| 57 | | - */ |
|---|
| 58 | | -#define EFX_RXD_HEAD_ROOM (1 + EFX_RX_MAX_FRAGS) |
|---|
| 59 | | - |
|---|
| 60 | | -static inline u8 *efx_rx_buf_va(struct efx_rx_buffer *buf) |
|---|
| 61 | | -{ |
|---|
| 62 | | - return page_address(buf->page) + buf->page_offset; |
|---|
| 63 | | -} |
|---|
| 64 | | - |
|---|
| 65 | | -static inline u32 efx_rx_buf_hash(struct efx_nic *efx, const u8 *eh) |
|---|
| 66 | | -{ |
|---|
| 67 | | -#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) |
|---|
| 68 | | - return __le32_to_cpup((const __le32 *)(eh + efx->rx_packet_hash_offset)); |
|---|
| 69 | | -#else |
|---|
| 70 | | - const u8 *data = eh + efx->rx_packet_hash_offset; |
|---|
| 71 | | - return (u32)data[0] | |
|---|
| 72 | | - (u32)data[1] << 8 | |
|---|
| 73 | | - (u32)data[2] << 16 | |
|---|
| 74 | | - (u32)data[3] << 24; |
|---|
| 75 | | -#endif |
|---|
| 76 | | -} |
|---|
| 77 | | - |
|---|
| 78 | | -static inline struct efx_rx_buffer * |
|---|
| 79 | | -efx_rx_buf_next(struct efx_rx_queue *rx_queue, struct efx_rx_buffer *rx_buf) |
|---|
| 80 | | -{ |
|---|
| 81 | | - if (unlikely(rx_buf == efx_rx_buffer(rx_queue, rx_queue->ptr_mask))) |
|---|
| 82 | | - return efx_rx_buffer(rx_queue, 0); |
|---|
| 83 | | - else |
|---|
| 84 | | - return rx_buf + 1; |
|---|
| 85 | | -} |
|---|
| 86 | | - |
|---|
| 87 | | -static inline void efx_sync_rx_buffer(struct efx_nic *efx, |
|---|
| 88 | | - struct efx_rx_buffer *rx_buf, |
|---|
| 89 | | - unsigned int len) |
|---|
| 90 | | -{ |
|---|
| 91 | | - dma_sync_single_for_cpu(&efx->pci_dev->dev, rx_buf->dma_addr, len, |
|---|
| 92 | | - DMA_FROM_DEVICE); |
|---|
| 93 | | -} |
|---|
| 94 | | - |
|---|
| 95 | | -void efx_rx_config_page_split(struct efx_nic *efx) |
|---|
| 96 | | -{ |
|---|
| 97 | | - efx->rx_page_buf_step = ALIGN(efx->rx_dma_len + efx->rx_ip_align, |
|---|
| 98 | | - EFX_RX_BUF_ALIGNMENT); |
|---|
| 99 | | - efx->rx_bufs_per_page = efx->rx_buffer_order ? 1 : |
|---|
| 100 | | - ((PAGE_SIZE - sizeof(struct efx_rx_page_state)) / |
|---|
| 101 | | - efx->rx_page_buf_step); |
|---|
| 102 | | - efx->rx_buffer_truesize = (PAGE_SIZE << efx->rx_buffer_order) / |
|---|
| 103 | | - efx->rx_bufs_per_page; |
|---|
| 104 | | - efx->rx_pages_per_batch = DIV_ROUND_UP(EFX_RX_PREFERRED_BATCH, |
|---|
| 105 | | - efx->rx_bufs_per_page); |
|---|
| 106 | | -} |
|---|
| 107 | | - |
|---|
| 108 | | -/* Check the RX page recycle ring for a page that can be reused. */ |
|---|
| 109 | | -static struct page *efx_reuse_page(struct efx_rx_queue *rx_queue) |
|---|
| 110 | | -{ |
|---|
| 111 | | - struct efx_nic *efx = rx_queue->efx; |
|---|
| 112 | | - struct page *page; |
|---|
| 113 | | - struct efx_rx_page_state *state; |
|---|
| 114 | | - unsigned index; |
|---|
| 115 | | - |
|---|
| 116 | | - index = rx_queue->page_remove & rx_queue->page_ptr_mask; |
|---|
| 117 | | - page = rx_queue->page_ring[index]; |
|---|
| 118 | | - if (page == NULL) |
|---|
| 119 | | - return NULL; |
|---|
| 120 | | - |
|---|
| 121 | | - rx_queue->page_ring[index] = NULL; |
|---|
| 122 | | - /* page_remove cannot exceed page_add. */ |
|---|
| 123 | | - if (rx_queue->page_remove != rx_queue->page_add) |
|---|
| 124 | | - ++rx_queue->page_remove; |
|---|
| 125 | | - |
|---|
| 126 | | - /* If page_count is 1 then we hold the only reference to this page. */ |
|---|
| 127 | | - if (page_count(page) == 1) { |
|---|
| 128 | | - ++rx_queue->page_recycle_count; |
|---|
| 129 | | - return page; |
|---|
| 130 | | - } else { |
|---|
| 131 | | - state = page_address(page); |
|---|
| 132 | | - dma_unmap_page(&efx->pci_dev->dev, state->dma_addr, |
|---|
| 133 | | - PAGE_SIZE << efx->rx_buffer_order, |
|---|
| 134 | | - DMA_FROM_DEVICE); |
|---|
| 135 | | - put_page(page); |
|---|
| 136 | | - ++rx_queue->page_recycle_failed; |
|---|
| 137 | | - } |
|---|
| 138 | | - |
|---|
| 139 | | - return NULL; |
|---|
| 140 | | -} |
|---|
| 141 | | - |
|---|
| 142 | | -/** |
|---|
| 143 | | - * efx_init_rx_buffers - create EFX_RX_BATCH page-based RX buffers |
|---|
| 144 | | - * |
|---|
| 145 | | - * @rx_queue: Efx RX queue |
|---|
| 146 | | - * |
|---|
| 147 | | - * This allocates a batch of pages, maps them for DMA, and populates |
|---|
| 148 | | - * struct efx_rx_buffers for each one. Return a negative error code or |
|---|
| 149 | | - * 0 on success. If a single page can be used for multiple buffers, |
|---|
| 150 | | - * then the page will either be inserted fully, or not at all. |
|---|
| 151 | | - */ |
|---|
| 152 | | -static int efx_init_rx_buffers(struct efx_rx_queue *rx_queue, bool atomic) |
|---|
| 153 | | -{ |
|---|
| 154 | | - struct efx_nic *efx = rx_queue->efx; |
|---|
| 155 | | - struct efx_rx_buffer *rx_buf; |
|---|
| 156 | | - struct page *page; |
|---|
| 157 | | - unsigned int page_offset; |
|---|
| 158 | | - struct efx_rx_page_state *state; |
|---|
| 159 | | - dma_addr_t dma_addr; |
|---|
| 160 | | - unsigned index, count; |
|---|
| 161 | | - |
|---|
| 162 | | - count = 0; |
|---|
| 163 | | - do { |
|---|
| 164 | | - page = efx_reuse_page(rx_queue); |
|---|
| 165 | | - if (page == NULL) { |
|---|
| 166 | | - page = alloc_pages(__GFP_COMP | |
|---|
| 167 | | - (atomic ? GFP_ATOMIC : GFP_KERNEL), |
|---|
| 168 | | - efx->rx_buffer_order); |
|---|
| 169 | | - if (unlikely(page == NULL)) |
|---|
| 170 | | - return -ENOMEM; |
|---|
| 171 | | - dma_addr = |
|---|
| 172 | | - dma_map_page(&efx->pci_dev->dev, page, 0, |
|---|
| 173 | | - PAGE_SIZE << efx->rx_buffer_order, |
|---|
| 174 | | - DMA_FROM_DEVICE); |
|---|
| 175 | | - if (unlikely(dma_mapping_error(&efx->pci_dev->dev, |
|---|
| 176 | | - dma_addr))) { |
|---|
| 177 | | - __free_pages(page, efx->rx_buffer_order); |
|---|
| 178 | | - return -EIO; |
|---|
| 179 | | - } |
|---|
| 180 | | - state = page_address(page); |
|---|
| 181 | | - state->dma_addr = dma_addr; |
|---|
| 182 | | - } else { |
|---|
| 183 | | - state = page_address(page); |
|---|
| 184 | | - dma_addr = state->dma_addr; |
|---|
| 185 | | - } |
|---|
| 186 | | - |
|---|
| 187 | | - dma_addr += sizeof(struct efx_rx_page_state); |
|---|
| 188 | | - page_offset = sizeof(struct efx_rx_page_state); |
|---|
| 189 | | - |
|---|
| 190 | | - do { |
|---|
| 191 | | - index = rx_queue->added_count & rx_queue->ptr_mask; |
|---|
| 192 | | - rx_buf = efx_rx_buffer(rx_queue, index); |
|---|
| 193 | | - rx_buf->dma_addr = dma_addr + efx->rx_ip_align; |
|---|
| 194 | | - rx_buf->page = page; |
|---|
| 195 | | - rx_buf->page_offset = page_offset + efx->rx_ip_align; |
|---|
| 196 | | - rx_buf->len = efx->rx_dma_len; |
|---|
| 197 | | - rx_buf->flags = 0; |
|---|
| 198 | | - ++rx_queue->added_count; |
|---|
| 199 | | - get_page(page); |
|---|
| 200 | | - dma_addr += efx->rx_page_buf_step; |
|---|
| 201 | | - page_offset += efx->rx_page_buf_step; |
|---|
| 202 | | - } while (page_offset + efx->rx_page_buf_step <= PAGE_SIZE); |
|---|
| 203 | | - |
|---|
| 204 | | - rx_buf->flags = EFX_RX_BUF_LAST_IN_PAGE; |
|---|
| 205 | | - } while (++count < efx->rx_pages_per_batch); |
|---|
| 206 | | - |
|---|
| 207 | | - return 0; |
|---|
| 208 | | -} |
|---|
| 209 | | - |
|---|
| 210 | | -/* Unmap a DMA-mapped page. This function is only called for the final RX |
|---|
| 211 | | - * buffer in a page. |
|---|
| 212 | | - */ |
|---|
| 213 | | -static void efx_unmap_rx_buffer(struct efx_nic *efx, |
|---|
| 214 | | - struct efx_rx_buffer *rx_buf) |
|---|
| 215 | | -{ |
|---|
| 216 | | - struct page *page = rx_buf->page; |
|---|
| 217 | | - |
|---|
| 218 | | - if (page) { |
|---|
| 219 | | - struct efx_rx_page_state *state = page_address(page); |
|---|
| 220 | | - dma_unmap_page(&efx->pci_dev->dev, |
|---|
| 221 | | - state->dma_addr, |
|---|
| 222 | | - PAGE_SIZE << efx->rx_buffer_order, |
|---|
| 223 | | - DMA_FROM_DEVICE); |
|---|
| 224 | | - } |
|---|
| 225 | | -} |
|---|
| 226 | | - |
|---|
| 227 | | -static void efx_free_rx_buffers(struct efx_rx_queue *rx_queue, |
|---|
| 228 | | - struct efx_rx_buffer *rx_buf, |
|---|
| 229 | | - unsigned int num_bufs) |
|---|
| 230 | | -{ |
|---|
| 231 | | - do { |
|---|
| 232 | | - if (rx_buf->page) { |
|---|
| 233 | | - put_page(rx_buf->page); |
|---|
| 234 | | - rx_buf->page = NULL; |
|---|
| 235 | | - } |
|---|
| 236 | | - rx_buf = efx_rx_buf_next(rx_queue, rx_buf); |
|---|
| 237 | | - } while (--num_bufs); |
|---|
| 238 | | -} |
|---|
| 239 | | - |
|---|
| 240 | | -/* Attempt to recycle the page if there is an RX recycle ring; the page can |
|---|
| 241 | | - * only be added if this is the final RX buffer, to prevent pages being used in |
|---|
| 242 | | - * the descriptor ring and appearing in the recycle ring simultaneously. |
|---|
| 243 | | - */ |
|---|
| 244 | | -static void efx_recycle_rx_page(struct efx_channel *channel, |
|---|
| 245 | | - struct efx_rx_buffer *rx_buf) |
|---|
| 246 | | -{ |
|---|
| 247 | | - struct page *page = rx_buf->page; |
|---|
| 248 | | - struct efx_rx_queue *rx_queue = efx_channel_get_rx_queue(channel); |
|---|
| 249 | | - struct efx_nic *efx = rx_queue->efx; |
|---|
| 250 | | - unsigned index; |
|---|
| 251 | | - |
|---|
| 252 | | - /* Only recycle the page after processing the final buffer. */ |
|---|
| 253 | | - if (!(rx_buf->flags & EFX_RX_BUF_LAST_IN_PAGE)) |
|---|
| 254 | | - return; |
|---|
| 255 | | - |
|---|
| 256 | | - index = rx_queue->page_add & rx_queue->page_ptr_mask; |
|---|
| 257 | | - if (rx_queue->page_ring[index] == NULL) { |
|---|
| 258 | | - unsigned read_index = rx_queue->page_remove & |
|---|
| 259 | | - rx_queue->page_ptr_mask; |
|---|
| 260 | | - |
|---|
| 261 | | - /* The next slot in the recycle ring is available, but |
|---|
| 262 | | - * increment page_remove if the read pointer currently |
|---|
| 263 | | - * points here. |
|---|
| 264 | | - */ |
|---|
| 265 | | - if (read_index == index) |
|---|
| 266 | | - ++rx_queue->page_remove; |
|---|
| 267 | | - rx_queue->page_ring[index] = page; |
|---|
| 268 | | - ++rx_queue->page_add; |
|---|
| 269 | | - return; |
|---|
| 270 | | - } |
|---|
| 271 | | - ++rx_queue->page_recycle_full; |
|---|
| 272 | | - efx_unmap_rx_buffer(efx, rx_buf); |
|---|
| 273 | | - put_page(rx_buf->page); |
|---|
| 274 | | -} |
|---|
| 275 | | - |
|---|
| 276 | | -static void efx_fini_rx_buffer(struct efx_rx_queue *rx_queue, |
|---|
| 277 | | - struct efx_rx_buffer *rx_buf) |
|---|
| 278 | | -{ |
|---|
| 279 | | - /* Release the page reference we hold for the buffer. */ |
|---|
| 280 | | - if (rx_buf->page) |
|---|
| 281 | | - put_page(rx_buf->page); |
|---|
| 282 | | - |
|---|
| 283 | | - /* If this is the last buffer in a page, unmap and free it. */ |
|---|
| 284 | | - if (rx_buf->flags & EFX_RX_BUF_LAST_IN_PAGE) { |
|---|
| 285 | | - efx_unmap_rx_buffer(rx_queue->efx, rx_buf); |
|---|
| 286 | | - efx_free_rx_buffers(rx_queue, rx_buf, 1); |
|---|
| 287 | | - } |
|---|
| 288 | | - rx_buf->page = NULL; |
|---|
| 289 | | -} |
|---|
| 290 | | - |
|---|
| 291 | | -/* Recycle the pages that are used by buffers that have just been received. */ |
|---|
| 292 | | -static void efx_recycle_rx_pages(struct efx_channel *channel, |
|---|
| 293 | | - struct efx_rx_buffer *rx_buf, |
|---|
| 294 | | - unsigned int n_frags) |
|---|
| 295 | | -{ |
|---|
| 296 | | - struct efx_rx_queue *rx_queue = efx_channel_get_rx_queue(channel); |
|---|
| 297 | | - |
|---|
| 298 | | - do { |
|---|
| 299 | | - efx_recycle_rx_page(channel, rx_buf); |
|---|
| 300 | | - rx_buf = efx_rx_buf_next(rx_queue, rx_buf); |
|---|
| 301 | | - } while (--n_frags); |
|---|
| 302 | | -} |
|---|
| 303 | | - |
|---|
| 304 | | -static void efx_discard_rx_packet(struct efx_channel *channel, |
|---|
| 305 | | - struct efx_rx_buffer *rx_buf, |
|---|
| 306 | | - unsigned int n_frags) |
|---|
| 307 | | -{ |
|---|
| 308 | | - struct efx_rx_queue *rx_queue = efx_channel_get_rx_queue(channel); |
|---|
| 309 | | - |
|---|
| 310 | | - efx_recycle_rx_pages(channel, rx_buf, n_frags); |
|---|
| 311 | | - |
|---|
| 312 | | - efx_free_rx_buffers(rx_queue, rx_buf, n_frags); |
|---|
| 313 | | -} |
|---|
| 314 | | - |
|---|
| 315 | | -/** |
|---|
| 316 | | - * efx_fast_push_rx_descriptors - push new RX descriptors quickly |
|---|
| 317 | | - * @rx_queue: RX descriptor queue |
|---|
| 318 | | - * |
|---|
| 319 | | - * This will aim to fill the RX descriptor queue up to |
|---|
| 320 | | - * @rx_queue->@max_fill. If there is insufficient atomic |
|---|
| 321 | | - * memory to do so, a slow fill will be scheduled. |
|---|
| 322 | | - * |
|---|
| 323 | | - * The caller must provide serialisation (none is used here). In practise, |
|---|
| 324 | | - * this means this function must run from the NAPI handler, or be called |
|---|
| 325 | | - * when NAPI is disabled. |
|---|
| 326 | | - */ |
|---|
| 327 | | -void efx_fast_push_rx_descriptors(struct efx_rx_queue *rx_queue, bool atomic) |
|---|
| 328 | | -{ |
|---|
| 329 | | - struct efx_nic *efx = rx_queue->efx; |
|---|
| 330 | | - unsigned int fill_level, batch_size; |
|---|
| 331 | | - int space, rc = 0; |
|---|
| 332 | | - |
|---|
| 333 | | - if (!rx_queue->refill_enabled) |
|---|
| 334 | | - return; |
|---|
| 335 | | - |
|---|
| 336 | | - /* Calculate current fill level, and exit if we don't need to fill */ |
|---|
| 337 | | - fill_level = (rx_queue->added_count - rx_queue->removed_count); |
|---|
| 338 | | - EFX_WARN_ON_ONCE_PARANOID(fill_level > rx_queue->efx->rxq_entries); |
|---|
| 339 | | - if (fill_level >= rx_queue->fast_fill_trigger) |
|---|
| 340 | | - goto out; |
|---|
| 341 | | - |
|---|
| 342 | | - /* Record minimum fill level */ |
|---|
| 343 | | - if (unlikely(fill_level < rx_queue->min_fill)) { |
|---|
| 344 | | - if (fill_level) |
|---|
| 345 | | - rx_queue->min_fill = fill_level; |
|---|
| 346 | | - } |
|---|
| 347 | | - |
|---|
| 348 | | - batch_size = efx->rx_pages_per_batch * efx->rx_bufs_per_page; |
|---|
| 349 | | - space = rx_queue->max_fill - fill_level; |
|---|
| 350 | | - EFX_WARN_ON_ONCE_PARANOID(space < batch_size); |
|---|
| 351 | | - |
|---|
| 352 | | - netif_vdbg(rx_queue->efx, rx_status, rx_queue->efx->net_dev, |
|---|
| 353 | | - "RX queue %d fast-filling descriptor ring from" |
|---|
| 354 | | - " level %d to level %d\n", |
|---|
| 355 | | - efx_rx_queue_index(rx_queue), fill_level, |
|---|
| 356 | | - rx_queue->max_fill); |
|---|
| 357 | | - |
|---|
| 358 | | - |
|---|
| 359 | | - do { |
|---|
| 360 | | - rc = efx_init_rx_buffers(rx_queue, atomic); |
|---|
| 361 | | - if (unlikely(rc)) { |
|---|
| 362 | | - /* Ensure that we don't leave the rx queue empty */ |
|---|
| 363 | | - if (rx_queue->added_count == rx_queue->removed_count) |
|---|
| 364 | | - efx_schedule_slow_fill(rx_queue); |
|---|
| 365 | | - goto out; |
|---|
| 366 | | - } |
|---|
| 367 | | - } while ((space -= batch_size) >= batch_size); |
|---|
| 368 | | - |
|---|
| 369 | | - netif_vdbg(rx_queue->efx, rx_status, rx_queue->efx->net_dev, |
|---|
| 370 | | - "RX queue %d fast-filled descriptor ring " |
|---|
| 371 | | - "to level %d\n", efx_rx_queue_index(rx_queue), |
|---|
| 372 | | - rx_queue->added_count - rx_queue->removed_count); |
|---|
| 373 | | - |
|---|
| 374 | | - out: |
|---|
| 375 | | - if (rx_queue->notified_count != rx_queue->added_count) |
|---|
| 376 | | - efx_nic_notify_rx_desc(rx_queue); |
|---|
| 377 | | -} |
|---|
| 378 | | - |
|---|
| 379 | | -void efx_rx_slow_fill(struct timer_list *t) |
|---|
| 380 | | -{ |
|---|
| 381 | | - struct efx_rx_queue *rx_queue = from_timer(rx_queue, t, slow_fill); |
|---|
| 382 | | - |
|---|
| 383 | | - /* Post an event to cause NAPI to run and refill the queue */ |
|---|
| 384 | | - efx_nic_generate_fill_event(rx_queue); |
|---|
| 385 | | - ++rx_queue->slow_fill_count; |
|---|
| 386 | | -} |
|---|
| 387 | 42 | |
|---|
| 388 | 43 | static void efx_rx_packet__check_len(struct efx_rx_queue *rx_queue, |
|---|
| 389 | 44 | struct efx_rx_buffer *rx_buf, |
|---|
| .. | .. |
|---|
| 406 | 61 | efx_rx_queue_index(rx_queue), len, max_len); |
|---|
| 407 | 62 | |
|---|
| 408 | 63 | efx_rx_queue_channel(rx_queue)->n_rx_overlength++; |
|---|
| 409 | | -} |
|---|
| 410 | | - |
|---|
| 411 | | -/* Pass a received packet up through GRO. GRO can handle pages |
|---|
| 412 | | - * regardless of checksum state and skbs with a good checksum. |
|---|
| 413 | | - */ |
|---|
| 414 | | -static void |
|---|
| 415 | | -efx_rx_packet_gro(struct efx_channel *channel, struct efx_rx_buffer *rx_buf, |
|---|
| 416 | | - unsigned int n_frags, u8 *eh) |
|---|
| 417 | | -{ |
|---|
| 418 | | - struct napi_struct *napi = &channel->napi_str; |
|---|
| 419 | | - gro_result_t gro_result; |
|---|
| 420 | | - struct efx_nic *efx = channel->efx; |
|---|
| 421 | | - struct sk_buff *skb; |
|---|
| 422 | | - |
|---|
| 423 | | - skb = napi_get_frags(napi); |
|---|
| 424 | | - if (unlikely(!skb)) { |
|---|
| 425 | | - struct efx_rx_queue *rx_queue; |
|---|
| 426 | | - |
|---|
| 427 | | - rx_queue = efx_channel_get_rx_queue(channel); |
|---|
| 428 | | - efx_free_rx_buffers(rx_queue, rx_buf, n_frags); |
|---|
| 429 | | - return; |
|---|
| 430 | | - } |
|---|
| 431 | | - |
|---|
| 432 | | - if (efx->net_dev->features & NETIF_F_RXHASH) |
|---|
| 433 | | - skb_set_hash(skb, efx_rx_buf_hash(efx, eh), |
|---|
| 434 | | - PKT_HASH_TYPE_L3); |
|---|
| 435 | | - skb->ip_summed = ((rx_buf->flags & EFX_RX_PKT_CSUMMED) ? |
|---|
| 436 | | - CHECKSUM_UNNECESSARY : CHECKSUM_NONE); |
|---|
| 437 | | - skb->csum_level = !!(rx_buf->flags & EFX_RX_PKT_CSUM_LEVEL); |
|---|
| 438 | | - |
|---|
| 439 | | - for (;;) { |
|---|
| 440 | | - skb_fill_page_desc(skb, skb_shinfo(skb)->nr_frags, |
|---|
| 441 | | - rx_buf->page, rx_buf->page_offset, |
|---|
| 442 | | - rx_buf->len); |
|---|
| 443 | | - rx_buf->page = NULL; |
|---|
| 444 | | - skb->len += rx_buf->len; |
|---|
| 445 | | - if (skb_shinfo(skb)->nr_frags == n_frags) |
|---|
| 446 | | - break; |
|---|
| 447 | | - |
|---|
| 448 | | - rx_buf = efx_rx_buf_next(&channel->rx_queue, rx_buf); |
|---|
| 449 | | - } |
|---|
| 450 | | - |
|---|
| 451 | | - skb->data_len = skb->len; |
|---|
| 452 | | - skb->truesize += n_frags * efx->rx_buffer_truesize; |
|---|
| 453 | | - |
|---|
| 454 | | - skb_record_rx_queue(skb, channel->rx_queue.core_index); |
|---|
| 455 | | - |
|---|
| 456 | | - gro_result = napi_gro_frags(napi); |
|---|
| 457 | | - if (gro_result != GRO_DROP) |
|---|
| 458 | | - channel->irq_mod_score += 2; |
|---|
| 459 | 64 | } |
|---|
| 460 | 65 | |
|---|
| 461 | 66 | /* Allocate and construct an SKB around page fragments */ |
|---|
| .. | .. |
|---|
| 642 | 247 | netif_receive_skb(skb); |
|---|
| 643 | 248 | } |
|---|
| 644 | 249 | |
|---|
| 250 | +/** efx_do_xdp: perform XDP processing on a received packet |
|---|
| 251 | + * |
|---|
| 252 | + * Returns true if packet should still be delivered. |
|---|
| 253 | + */ |
|---|
| 254 | +static bool efx_do_xdp(struct efx_nic *efx, struct efx_channel *channel, |
|---|
| 255 | + struct efx_rx_buffer *rx_buf, u8 **ehp) |
|---|
| 256 | +{ |
|---|
| 257 | + u8 rx_prefix[EFX_MAX_RX_PREFIX_SIZE]; |
|---|
| 258 | + struct efx_rx_queue *rx_queue; |
|---|
| 259 | + struct bpf_prog *xdp_prog; |
|---|
| 260 | + struct xdp_frame *xdpf; |
|---|
| 261 | + struct xdp_buff xdp; |
|---|
| 262 | + u32 xdp_act; |
|---|
| 263 | + s16 offset; |
|---|
| 264 | + int err; |
|---|
| 265 | + |
|---|
| 266 | + rcu_read_lock(); |
|---|
| 267 | + xdp_prog = rcu_dereference(efx->xdp_prog); |
|---|
| 268 | + if (!xdp_prog) { |
|---|
| 269 | + rcu_read_unlock(); |
|---|
| 270 | + return true; |
|---|
| 271 | + } |
|---|
| 272 | + |
|---|
| 273 | + rx_queue = efx_channel_get_rx_queue(channel); |
|---|
| 274 | + |
|---|
| 275 | + if (unlikely(channel->rx_pkt_n_frags > 1)) { |
|---|
| 276 | + /* We can't do XDP on fragmented packets - drop. */ |
|---|
| 277 | + rcu_read_unlock(); |
|---|
| 278 | + efx_free_rx_buffers(rx_queue, rx_buf, |
|---|
| 279 | + channel->rx_pkt_n_frags); |
|---|
| 280 | + if (net_ratelimit()) |
|---|
| 281 | + netif_err(efx, rx_err, efx->net_dev, |
|---|
| 282 | + "XDP is not possible with multiple receive fragments (%d)\n", |
|---|
| 283 | + channel->rx_pkt_n_frags); |
|---|
| 284 | + channel->n_rx_xdp_bad_drops++; |
|---|
| 285 | + return false; |
|---|
| 286 | + } |
|---|
| 287 | + |
|---|
| 288 | + dma_sync_single_for_cpu(&efx->pci_dev->dev, rx_buf->dma_addr, |
|---|
| 289 | + rx_buf->len, DMA_FROM_DEVICE); |
|---|
| 290 | + |
|---|
| 291 | + /* Save the rx prefix. */ |
|---|
| 292 | + EFX_WARN_ON_PARANOID(efx->rx_prefix_size > EFX_MAX_RX_PREFIX_SIZE); |
|---|
| 293 | + memcpy(rx_prefix, *ehp - efx->rx_prefix_size, |
|---|
| 294 | + efx->rx_prefix_size); |
|---|
| 295 | + |
|---|
| 296 | + xdp.data = *ehp; |
|---|
| 297 | + xdp.data_hard_start = xdp.data - EFX_XDP_HEADROOM; |
|---|
| 298 | + |
|---|
| 299 | + /* No support yet for XDP metadata */ |
|---|
| 300 | + xdp_set_data_meta_invalid(&xdp); |
|---|
| 301 | + xdp.data_end = xdp.data + rx_buf->len; |
|---|
| 302 | + xdp.rxq = &rx_queue->xdp_rxq_info; |
|---|
| 303 | + xdp.frame_sz = efx->rx_page_buf_step; |
|---|
| 304 | + |
|---|
| 305 | + xdp_act = bpf_prog_run_xdp(xdp_prog, &xdp); |
|---|
| 306 | + rcu_read_unlock(); |
|---|
| 307 | + |
|---|
| 308 | + offset = (u8 *)xdp.data - *ehp; |
|---|
| 309 | + |
|---|
| 310 | + switch (xdp_act) { |
|---|
| 311 | + case XDP_PASS: |
|---|
| 312 | + /* Fix up rx prefix. */ |
|---|
| 313 | + if (offset) { |
|---|
| 314 | + *ehp += offset; |
|---|
| 315 | + rx_buf->page_offset += offset; |
|---|
| 316 | + rx_buf->len -= offset; |
|---|
| 317 | + memcpy(*ehp - efx->rx_prefix_size, rx_prefix, |
|---|
| 318 | + efx->rx_prefix_size); |
|---|
| 319 | + } |
|---|
| 320 | + break; |
|---|
| 321 | + |
|---|
| 322 | + case XDP_TX: |
|---|
| 323 | + /* Buffer ownership passes to tx on success. */ |
|---|
| 324 | + xdpf = xdp_convert_buff_to_frame(&xdp); |
|---|
| 325 | + err = efx_xdp_tx_buffers(efx, 1, &xdpf, true); |
|---|
| 326 | + if (unlikely(err != 1)) { |
|---|
| 327 | + efx_free_rx_buffers(rx_queue, rx_buf, 1); |
|---|
| 328 | + if (net_ratelimit()) |
|---|
| 329 | + netif_err(efx, rx_err, efx->net_dev, |
|---|
| 330 | + "XDP TX failed (%d)\n", err); |
|---|
| 331 | + channel->n_rx_xdp_bad_drops++; |
|---|
| 332 | + trace_xdp_exception(efx->net_dev, xdp_prog, xdp_act); |
|---|
| 333 | + } else { |
|---|
| 334 | + channel->n_rx_xdp_tx++; |
|---|
| 335 | + } |
|---|
| 336 | + break; |
|---|
| 337 | + |
|---|
| 338 | + case XDP_REDIRECT: |
|---|
| 339 | + err = xdp_do_redirect(efx->net_dev, &xdp, xdp_prog); |
|---|
| 340 | + if (unlikely(err)) { |
|---|
| 341 | + efx_free_rx_buffers(rx_queue, rx_buf, 1); |
|---|
| 342 | + if (net_ratelimit()) |
|---|
| 343 | + netif_err(efx, rx_err, efx->net_dev, |
|---|
| 344 | + "XDP redirect failed (%d)\n", err); |
|---|
| 345 | + channel->n_rx_xdp_bad_drops++; |
|---|
| 346 | + trace_xdp_exception(efx->net_dev, xdp_prog, xdp_act); |
|---|
| 347 | + } else { |
|---|
| 348 | + channel->n_rx_xdp_redirect++; |
|---|
| 349 | + } |
|---|
| 350 | + break; |
|---|
| 351 | + |
|---|
| 352 | + default: |
|---|
| 353 | + bpf_warn_invalid_xdp_action(xdp_act); |
|---|
| 354 | + efx_free_rx_buffers(rx_queue, rx_buf, 1); |
|---|
| 355 | + channel->n_rx_xdp_bad_drops++; |
|---|
| 356 | + trace_xdp_exception(efx->net_dev, xdp_prog, xdp_act); |
|---|
| 357 | + break; |
|---|
| 358 | + |
|---|
| 359 | + case XDP_ABORTED: |
|---|
| 360 | + trace_xdp_exception(efx->net_dev, xdp_prog, xdp_act); |
|---|
| 361 | + fallthrough; |
|---|
| 362 | + case XDP_DROP: |
|---|
| 363 | + efx_free_rx_buffers(rx_queue, rx_buf, 1); |
|---|
| 364 | + channel->n_rx_xdp_drops++; |
|---|
| 365 | + break; |
|---|
| 366 | + } |
|---|
| 367 | + |
|---|
| 368 | + return xdp_act == XDP_PASS; |
|---|
| 369 | +} |
|---|
| 370 | + |
|---|
| 645 | 371 | /* Handle a received packet. Second half: Touches packet payload. */ |
|---|
| 646 | 372 | void __efx_rx_packet(struct efx_channel *channel) |
|---|
| 647 | 373 | { |
|---|
| .. | .. |
|---|
| 670 | 396 | goto out; |
|---|
| 671 | 397 | } |
|---|
| 672 | 398 | |
|---|
| 399 | + if (!efx_do_xdp(efx, channel, rx_buf, &eh)) |
|---|
| 400 | + goto out; |
|---|
| 401 | + |
|---|
| 673 | 402 | if (unlikely(!(efx->net_dev->features & NETIF_F_RXCSUM))) |
|---|
| 674 | 403 | rx_buf->flags &= ~EFX_RX_PKT_CSUMMED; |
|---|
| 675 | 404 | |
|---|
| 676 | 405 | if ((rx_buf->flags & EFX_RX_PKT_TCP) && !channel->type->receive_skb) |
|---|
| 677 | | - efx_rx_packet_gro(channel, rx_buf, channel->rx_pkt_n_frags, eh); |
|---|
| 406 | + efx_rx_packet_gro(channel, rx_buf, channel->rx_pkt_n_frags, eh, 0); |
|---|
| 678 | 407 | else |
|---|
| 679 | 408 | efx_rx_deliver(channel, eh, rx_buf, channel->rx_pkt_n_frags); |
|---|
| 680 | 409 | out: |
|---|
| 681 | 410 | channel->rx_pkt_n_frags = 0; |
|---|
| 682 | | -} |
|---|
| 683 | | - |
|---|
| 684 | | -int efx_probe_rx_queue(struct efx_rx_queue *rx_queue) |
|---|
| 685 | | -{ |
|---|
| 686 | | - struct efx_nic *efx = rx_queue->efx; |
|---|
| 687 | | - unsigned int entries; |
|---|
| 688 | | - int rc; |
|---|
| 689 | | - |
|---|
| 690 | | - /* Create the smallest power-of-two aligned ring */ |
|---|
| 691 | | - entries = max(roundup_pow_of_two(efx->rxq_entries), EFX_MIN_DMAQ_SIZE); |
|---|
| 692 | | - EFX_WARN_ON_PARANOID(entries > EFX_MAX_DMAQ_SIZE); |
|---|
| 693 | | - rx_queue->ptr_mask = entries - 1; |
|---|
| 694 | | - |
|---|
| 695 | | - netif_dbg(efx, probe, efx->net_dev, |
|---|
| 696 | | - "creating RX queue %d size %#x mask %#x\n", |
|---|
| 697 | | - efx_rx_queue_index(rx_queue), efx->rxq_entries, |
|---|
| 698 | | - rx_queue->ptr_mask); |
|---|
| 699 | | - |
|---|
| 700 | | - /* Allocate RX buffers */ |
|---|
| 701 | | - rx_queue->buffer = kcalloc(entries, sizeof(*rx_queue->buffer), |
|---|
| 702 | | - GFP_KERNEL); |
|---|
| 703 | | - if (!rx_queue->buffer) |
|---|
| 704 | | - return -ENOMEM; |
|---|
| 705 | | - |
|---|
| 706 | | - rc = efx_nic_probe_rx(rx_queue); |
|---|
| 707 | | - if (rc) { |
|---|
| 708 | | - kfree(rx_queue->buffer); |
|---|
| 709 | | - rx_queue->buffer = NULL; |
|---|
| 710 | | - } |
|---|
| 711 | | - |
|---|
| 712 | | - return rc; |
|---|
| 713 | | -} |
|---|
| 714 | | - |
|---|
| 715 | | -static void efx_init_rx_recycle_ring(struct efx_nic *efx, |
|---|
| 716 | | - struct efx_rx_queue *rx_queue) |
|---|
| 717 | | -{ |
|---|
| 718 | | - unsigned int bufs_in_recycle_ring, page_ring_size; |
|---|
| 719 | | - |
|---|
| 720 | | - /* Set the RX recycle ring size */ |
|---|
| 721 | | -#ifdef CONFIG_PPC64 |
|---|
| 722 | | - bufs_in_recycle_ring = EFX_RECYCLE_RING_SIZE_IOMMU; |
|---|
| 723 | | -#else |
|---|
| 724 | | - if (iommu_present(&pci_bus_type)) |
|---|
| 725 | | - bufs_in_recycle_ring = EFX_RECYCLE_RING_SIZE_IOMMU; |
|---|
| 726 | | - else |
|---|
| 727 | | - bufs_in_recycle_ring = EFX_RECYCLE_RING_SIZE_NOIOMMU; |
|---|
| 728 | | -#endif /* CONFIG_PPC64 */ |
|---|
| 729 | | - |
|---|
| 730 | | - page_ring_size = roundup_pow_of_two(bufs_in_recycle_ring / |
|---|
| 731 | | - efx->rx_bufs_per_page); |
|---|
| 732 | | - rx_queue->page_ring = kcalloc(page_ring_size, |
|---|
| 733 | | - sizeof(*rx_queue->page_ring), GFP_KERNEL); |
|---|
| 734 | | - rx_queue->page_ptr_mask = page_ring_size - 1; |
|---|
| 735 | | -} |
|---|
| 736 | | - |
|---|
| 737 | | -void efx_init_rx_queue(struct efx_rx_queue *rx_queue) |
|---|
| 738 | | -{ |
|---|
| 739 | | - struct efx_nic *efx = rx_queue->efx; |
|---|
| 740 | | - unsigned int max_fill, trigger, max_trigger; |
|---|
| 741 | | - |
|---|
| 742 | | - netif_dbg(rx_queue->efx, drv, rx_queue->efx->net_dev, |
|---|
| 743 | | - "initialising RX queue %d\n", efx_rx_queue_index(rx_queue)); |
|---|
| 744 | | - |
|---|
| 745 | | - /* Initialise ptr fields */ |
|---|
| 746 | | - rx_queue->added_count = 0; |
|---|
| 747 | | - rx_queue->notified_count = 0; |
|---|
| 748 | | - rx_queue->removed_count = 0; |
|---|
| 749 | | - rx_queue->min_fill = -1U; |
|---|
| 750 | | - efx_init_rx_recycle_ring(efx, rx_queue); |
|---|
| 751 | | - |
|---|
| 752 | | - rx_queue->page_remove = 0; |
|---|
| 753 | | - rx_queue->page_add = rx_queue->page_ptr_mask + 1; |
|---|
| 754 | | - rx_queue->page_recycle_count = 0; |
|---|
| 755 | | - rx_queue->page_recycle_failed = 0; |
|---|
| 756 | | - rx_queue->page_recycle_full = 0; |
|---|
| 757 | | - |
|---|
| 758 | | - /* Initialise limit fields */ |
|---|
| 759 | | - max_fill = efx->rxq_entries - EFX_RXD_HEAD_ROOM; |
|---|
| 760 | | - max_trigger = |
|---|
| 761 | | - max_fill - efx->rx_pages_per_batch * efx->rx_bufs_per_page; |
|---|
| 762 | | - if (rx_refill_threshold != 0) { |
|---|
| 763 | | - trigger = max_fill * min(rx_refill_threshold, 100U) / 100U; |
|---|
| 764 | | - if (trigger > max_trigger) |
|---|
| 765 | | - trigger = max_trigger; |
|---|
| 766 | | - } else { |
|---|
| 767 | | - trigger = max_trigger; |
|---|
| 768 | | - } |
|---|
| 769 | | - |
|---|
| 770 | | - rx_queue->max_fill = max_fill; |
|---|
| 771 | | - rx_queue->fast_fill_trigger = trigger; |
|---|
| 772 | | - rx_queue->refill_enabled = true; |
|---|
| 773 | | - |
|---|
| 774 | | - /* Set up RX descriptor ring */ |
|---|
| 775 | | - efx_nic_init_rx(rx_queue); |
|---|
| 776 | | -} |
|---|
| 777 | | - |
|---|
| 778 | | -void efx_fini_rx_queue(struct efx_rx_queue *rx_queue) |
|---|
| 779 | | -{ |
|---|
| 780 | | - int i; |
|---|
| 781 | | - struct efx_nic *efx = rx_queue->efx; |
|---|
| 782 | | - struct efx_rx_buffer *rx_buf; |
|---|
| 783 | | - |
|---|
| 784 | | - netif_dbg(rx_queue->efx, drv, rx_queue->efx->net_dev, |
|---|
| 785 | | - "shutting down RX queue %d\n", efx_rx_queue_index(rx_queue)); |
|---|
| 786 | | - |
|---|
| 787 | | - del_timer_sync(&rx_queue->slow_fill); |
|---|
| 788 | | - |
|---|
| 789 | | - /* Release RX buffers from the current read ptr to the write ptr */ |
|---|
| 790 | | - if (rx_queue->buffer) { |
|---|
| 791 | | - for (i = rx_queue->removed_count; i < rx_queue->added_count; |
|---|
| 792 | | - i++) { |
|---|
| 793 | | - unsigned index = i & rx_queue->ptr_mask; |
|---|
| 794 | | - rx_buf = efx_rx_buffer(rx_queue, index); |
|---|
| 795 | | - efx_fini_rx_buffer(rx_queue, rx_buf); |
|---|
| 796 | | - } |
|---|
| 797 | | - } |
|---|
| 798 | | - |
|---|
| 799 | | - /* Unmap and release the pages in the recycle ring. Remove the ring. */ |
|---|
| 800 | | - for (i = 0; i <= rx_queue->page_ptr_mask; i++) { |
|---|
| 801 | | - struct page *page = rx_queue->page_ring[i]; |
|---|
| 802 | | - struct efx_rx_page_state *state; |
|---|
| 803 | | - |
|---|
| 804 | | - if (page == NULL) |
|---|
| 805 | | - continue; |
|---|
| 806 | | - |
|---|
| 807 | | - state = page_address(page); |
|---|
| 808 | | - dma_unmap_page(&efx->pci_dev->dev, state->dma_addr, |
|---|
| 809 | | - PAGE_SIZE << efx->rx_buffer_order, |
|---|
| 810 | | - DMA_FROM_DEVICE); |
|---|
| 811 | | - put_page(page); |
|---|
| 812 | | - } |
|---|
| 813 | | - kfree(rx_queue->page_ring); |
|---|
| 814 | | - rx_queue->page_ring = NULL; |
|---|
| 815 | | -} |
|---|
| 816 | | - |
|---|
| 817 | | -void efx_remove_rx_queue(struct efx_rx_queue *rx_queue) |
|---|
| 818 | | -{ |
|---|
| 819 | | - netif_dbg(rx_queue->efx, drv, rx_queue->efx->net_dev, |
|---|
| 820 | | - "destroying RX queue %d\n", efx_rx_queue_index(rx_queue)); |
|---|
| 821 | | - |
|---|
| 822 | | - efx_nic_remove_rx(rx_queue); |
|---|
| 823 | | - |
|---|
| 824 | | - kfree(rx_queue->buffer); |
|---|
| 825 | | - rx_queue->buffer = NULL; |
|---|
| 826 | | -} |
|---|
| 827 | | - |
|---|
| 828 | | - |
|---|
| 829 | | -module_param(rx_refill_threshold, uint, 0444); |
|---|
| 830 | | -MODULE_PARM_DESC(rx_refill_threshold, |
|---|
| 831 | | - "RX descriptor ring refill threshold (%)"); |
|---|
| 832 | | - |
|---|
| 833 | | -#ifdef CONFIG_RFS_ACCEL |
|---|
| 834 | | - |
|---|
| 835 | | -static void efx_filter_rfs_work(struct work_struct *data) |
|---|
| 836 | | -{ |
|---|
| 837 | | - struct efx_async_filter_insertion *req = container_of(data, struct efx_async_filter_insertion, |
|---|
| 838 | | - work); |
|---|
| 839 | | - struct efx_nic *efx = netdev_priv(req->net_dev); |
|---|
| 840 | | - struct efx_channel *channel = efx_get_channel(efx, req->rxq_index); |
|---|
| 841 | | - int slot_idx = req - efx->rps_slot; |
|---|
| 842 | | - struct efx_arfs_rule *rule; |
|---|
| 843 | | - u16 arfs_id = 0; |
|---|
| 844 | | - int rc; |
|---|
| 845 | | - |
|---|
| 846 | | - rc = efx->type->filter_insert(efx, &req->spec, true); |
|---|
| 847 | | - if (rc >= 0) |
|---|
| 848 | | - rc %= efx->type->max_rx_ip_filters; |
|---|
| 849 | | - if (efx->rps_hash_table) { |
|---|
| 850 | | - spin_lock_bh(&efx->rps_hash_lock); |
|---|
| 851 | | - rule = efx_rps_hash_find(efx, &req->spec); |
|---|
| 852 | | - /* The rule might have already gone, if someone else's request |
|---|
| 853 | | - * for the same spec was already worked and then expired before |
|---|
| 854 | | - * we got around to our work. In that case we have nothing |
|---|
| 855 | | - * tying us to an arfs_id, meaning that as soon as the filter |
|---|
| 856 | | - * is considered for expiry it will be removed. |
|---|
| 857 | | - */ |
|---|
| 858 | | - if (rule) { |
|---|
| 859 | | - if (rc < 0) |
|---|
| 860 | | - rule->filter_id = EFX_ARFS_FILTER_ID_ERROR; |
|---|
| 861 | | - else |
|---|
| 862 | | - rule->filter_id = rc; |
|---|
| 863 | | - arfs_id = rule->arfs_id; |
|---|
| 864 | | - } |
|---|
| 865 | | - spin_unlock_bh(&efx->rps_hash_lock); |
|---|
| 866 | | - } |
|---|
| 867 | | - if (rc >= 0) { |
|---|
| 868 | | - /* Remember this so we can check whether to expire the filter |
|---|
| 869 | | - * later. |
|---|
| 870 | | - */ |
|---|
| 871 | | - mutex_lock(&efx->rps_mutex); |
|---|
| 872 | | - channel->rps_flow_id[rc] = req->flow_id; |
|---|
| 873 | | - ++channel->rfs_filters_added; |
|---|
| 874 | | - mutex_unlock(&efx->rps_mutex); |
|---|
| 875 | | - |
|---|
| 876 | | - if (req->spec.ether_type == htons(ETH_P_IP)) |
|---|
| 877 | | - netif_info(efx, rx_status, efx->net_dev, |
|---|
| 878 | | - "steering %s %pI4:%u:%pI4:%u to queue %u [flow %u filter %d id %u]\n", |
|---|
| 879 | | - (req->spec.ip_proto == IPPROTO_TCP) ? "TCP" : "UDP", |
|---|
| 880 | | - req->spec.rem_host, ntohs(req->spec.rem_port), |
|---|
| 881 | | - req->spec.loc_host, ntohs(req->spec.loc_port), |
|---|
| 882 | | - req->rxq_index, req->flow_id, rc, arfs_id); |
|---|
| 883 | | - else |
|---|
| 884 | | - netif_info(efx, rx_status, efx->net_dev, |
|---|
| 885 | | - "steering %s [%pI6]:%u:[%pI6]:%u to queue %u [flow %u filter %d id %u]\n", |
|---|
| 886 | | - (req->spec.ip_proto == IPPROTO_TCP) ? "TCP" : "UDP", |
|---|
| 887 | | - req->spec.rem_host, ntohs(req->spec.rem_port), |
|---|
| 888 | | - req->spec.loc_host, ntohs(req->spec.loc_port), |
|---|
| 889 | | - req->rxq_index, req->flow_id, rc, arfs_id); |
|---|
| 890 | | - } |
|---|
| 891 | | - |
|---|
| 892 | | - /* Release references */ |
|---|
| 893 | | - clear_bit(slot_idx, &efx->rps_slot_map); |
|---|
| 894 | | - dev_put(req->net_dev); |
|---|
| 895 | | -} |
|---|
| 896 | | - |
|---|
| 897 | | -int efx_filter_rfs(struct net_device *net_dev, const struct sk_buff *skb, |
|---|
| 898 | | - u16 rxq_index, u32 flow_id) |
|---|
| 899 | | -{ |
|---|
| 900 | | - struct efx_nic *efx = netdev_priv(net_dev); |
|---|
| 901 | | - struct efx_async_filter_insertion *req; |
|---|
| 902 | | - struct efx_arfs_rule *rule; |
|---|
| 903 | | - struct flow_keys fk; |
|---|
| 904 | | - int slot_idx; |
|---|
| 905 | | - bool new; |
|---|
| 906 | | - int rc; |
|---|
| 907 | | - |
|---|
| 908 | | - /* find a free slot */ |
|---|
| 909 | | - for (slot_idx = 0; slot_idx < EFX_RPS_MAX_IN_FLIGHT; slot_idx++) |
|---|
| 910 | | - if (!test_and_set_bit(slot_idx, &efx->rps_slot_map)) |
|---|
| 911 | | - break; |
|---|
| 912 | | - if (slot_idx >= EFX_RPS_MAX_IN_FLIGHT) |
|---|
| 913 | | - return -EBUSY; |
|---|
| 914 | | - |
|---|
| 915 | | - if (flow_id == RPS_FLOW_ID_INVALID) { |
|---|
| 916 | | - rc = -EINVAL; |
|---|
| 917 | | - goto out_clear; |
|---|
| 918 | | - } |
|---|
| 919 | | - |
|---|
| 920 | | - if (!skb_flow_dissect_flow_keys(skb, &fk, 0)) { |
|---|
| 921 | | - rc = -EPROTONOSUPPORT; |
|---|
| 922 | | - goto out_clear; |
|---|
| 923 | | - } |
|---|
| 924 | | - |
|---|
| 925 | | - if (fk.basic.n_proto != htons(ETH_P_IP) && fk.basic.n_proto != htons(ETH_P_IPV6)) { |
|---|
| 926 | | - rc = -EPROTONOSUPPORT; |
|---|
| 927 | | - goto out_clear; |
|---|
| 928 | | - } |
|---|
| 929 | | - if (fk.control.flags & FLOW_DIS_IS_FRAGMENT) { |
|---|
| 930 | | - rc = -EPROTONOSUPPORT; |
|---|
| 931 | | - goto out_clear; |
|---|
| 932 | | - } |
|---|
| 933 | | - |
|---|
| 934 | | - req = efx->rps_slot + slot_idx; |
|---|
| 935 | | - efx_filter_init_rx(&req->spec, EFX_FILTER_PRI_HINT, |
|---|
| 936 | | - efx->rx_scatter ? EFX_FILTER_FLAG_RX_SCATTER : 0, |
|---|
| 937 | | - rxq_index); |
|---|
| 938 | | - req->spec.match_flags = |
|---|
| 939 | | - EFX_FILTER_MATCH_ETHER_TYPE | EFX_FILTER_MATCH_IP_PROTO | |
|---|
| 940 | | - EFX_FILTER_MATCH_LOC_HOST | EFX_FILTER_MATCH_LOC_PORT | |
|---|
| 941 | | - EFX_FILTER_MATCH_REM_HOST | EFX_FILTER_MATCH_REM_PORT; |
|---|
| 942 | | - req->spec.ether_type = fk.basic.n_proto; |
|---|
| 943 | | - req->spec.ip_proto = fk.basic.ip_proto; |
|---|
| 944 | | - |
|---|
| 945 | | - if (fk.basic.n_proto == htons(ETH_P_IP)) { |
|---|
| 946 | | - req->spec.rem_host[0] = fk.addrs.v4addrs.src; |
|---|
| 947 | | - req->spec.loc_host[0] = fk.addrs.v4addrs.dst; |
|---|
| 948 | | - } else { |
|---|
| 949 | | - memcpy(req->spec.rem_host, &fk.addrs.v6addrs.src, |
|---|
| 950 | | - sizeof(struct in6_addr)); |
|---|
| 951 | | - memcpy(req->spec.loc_host, &fk.addrs.v6addrs.dst, |
|---|
| 952 | | - sizeof(struct in6_addr)); |
|---|
| 953 | | - } |
|---|
| 954 | | - |
|---|
| 955 | | - req->spec.rem_port = fk.ports.src; |
|---|
| 956 | | - req->spec.loc_port = fk.ports.dst; |
|---|
| 957 | | - |
|---|
| 958 | | - if (efx->rps_hash_table) { |
|---|
| 959 | | - /* Add it to ARFS hash table */ |
|---|
| 960 | | - spin_lock(&efx->rps_hash_lock); |
|---|
| 961 | | - rule = efx_rps_hash_add(efx, &req->spec, &new); |
|---|
| 962 | | - if (!rule) { |
|---|
| 963 | | - rc = -ENOMEM; |
|---|
| 964 | | - goto out_unlock; |
|---|
| 965 | | - } |
|---|
| 966 | | - if (new) |
|---|
| 967 | | - rule->arfs_id = efx->rps_next_id++ % RPS_NO_FILTER; |
|---|
| 968 | | - rc = rule->arfs_id; |
|---|
| 969 | | - /* Skip if existing or pending filter already does the right thing */ |
|---|
| 970 | | - if (!new && rule->rxq_index == rxq_index && |
|---|
| 971 | | - rule->filter_id >= EFX_ARFS_FILTER_ID_PENDING) |
|---|
| 972 | | - goto out_unlock; |
|---|
| 973 | | - rule->rxq_index = rxq_index; |
|---|
| 974 | | - rule->filter_id = EFX_ARFS_FILTER_ID_PENDING; |
|---|
| 975 | | - spin_unlock(&efx->rps_hash_lock); |
|---|
| 976 | | - } else { |
|---|
| 977 | | - /* Without an ARFS hash table, we just use arfs_id 0 for all |
|---|
| 978 | | - * filters. This means if multiple flows hash to the same |
|---|
| 979 | | - * flow_id, all but the most recently touched will be eligible |
|---|
| 980 | | - * for expiry. |
|---|
| 981 | | - */ |
|---|
| 982 | | - rc = 0; |
|---|
| 983 | | - } |
|---|
| 984 | | - |
|---|
| 985 | | - /* Queue the request */ |
|---|
| 986 | | - dev_hold(req->net_dev = net_dev); |
|---|
| 987 | | - INIT_WORK(&req->work, efx_filter_rfs_work); |
|---|
| 988 | | - req->rxq_index = rxq_index; |
|---|
| 989 | | - req->flow_id = flow_id; |
|---|
| 990 | | - schedule_work(&req->work); |
|---|
| 991 | | - return rc; |
|---|
| 992 | | -out_unlock: |
|---|
| 993 | | - spin_unlock(&efx->rps_hash_lock); |
|---|
| 994 | | -out_clear: |
|---|
| 995 | | - clear_bit(slot_idx, &efx->rps_slot_map); |
|---|
| 996 | | - return rc; |
|---|
| 997 | | -} |
|---|
| 998 | | - |
|---|
| 999 | | -bool __efx_filter_rfs_expire(struct efx_nic *efx, unsigned int quota) |
|---|
| 1000 | | -{ |
|---|
| 1001 | | - bool (*expire_one)(struct efx_nic *efx, u32 flow_id, unsigned int index); |
|---|
| 1002 | | - unsigned int channel_idx, index, size; |
|---|
| 1003 | | - u32 flow_id; |
|---|
| 1004 | | - |
|---|
| 1005 | | - if (!mutex_trylock(&efx->rps_mutex)) |
|---|
| 1006 | | - return false; |
|---|
| 1007 | | - expire_one = efx->type->filter_rfs_expire_one; |
|---|
| 1008 | | - channel_idx = efx->rps_expire_channel; |
|---|
| 1009 | | - index = efx->rps_expire_index; |
|---|
| 1010 | | - size = efx->type->max_rx_ip_filters; |
|---|
| 1011 | | - while (quota--) { |
|---|
| 1012 | | - struct efx_channel *channel = efx_get_channel(efx, channel_idx); |
|---|
| 1013 | | - flow_id = channel->rps_flow_id[index]; |
|---|
| 1014 | | - |
|---|
| 1015 | | - if (flow_id != RPS_FLOW_ID_INVALID && |
|---|
| 1016 | | - expire_one(efx, flow_id, index)) { |
|---|
| 1017 | | - netif_info(efx, rx_status, efx->net_dev, |
|---|
| 1018 | | - "expired filter %d [queue %u flow %u]\n", |
|---|
| 1019 | | - index, channel_idx, flow_id); |
|---|
| 1020 | | - channel->rps_flow_id[index] = RPS_FLOW_ID_INVALID; |
|---|
| 1021 | | - } |
|---|
| 1022 | | - if (++index == size) { |
|---|
| 1023 | | - if (++channel_idx == efx->n_channels) |
|---|
| 1024 | | - channel_idx = 0; |
|---|
| 1025 | | - index = 0; |
|---|
| 1026 | | - } |
|---|
| 1027 | | - } |
|---|
| 1028 | | - efx->rps_expire_channel = channel_idx; |
|---|
| 1029 | | - efx->rps_expire_index = index; |
|---|
| 1030 | | - |
|---|
| 1031 | | - mutex_unlock(&efx->rps_mutex); |
|---|
| 1032 | | - return true; |
|---|
| 1033 | | -} |
|---|
| 1034 | | - |
|---|
| 1035 | | -#endif /* CONFIG_RFS_ACCEL */ |
|---|
| 1036 | | - |
|---|
| 1037 | | -/** |
|---|
| 1038 | | - * efx_filter_is_mc_recipient - test whether spec is a multicast recipient |
|---|
| 1039 | | - * @spec: Specification to test |
|---|
| 1040 | | - * |
|---|
| 1041 | | - * Return: %true if the specification is a non-drop RX filter that |
|---|
| 1042 | | - * matches a local MAC address I/G bit value of 1 or matches a local |
|---|
| 1043 | | - * IPv4 or IPv6 address value in the respective multicast address |
|---|
| 1044 | | - * range. Otherwise %false. |
|---|
| 1045 | | - */ |
|---|
| 1046 | | -bool efx_filter_is_mc_recipient(const struct efx_filter_spec *spec) |
|---|
| 1047 | | -{ |
|---|
| 1048 | | - if (!(spec->flags & EFX_FILTER_FLAG_RX) || |
|---|
| 1049 | | - spec->dmaq_id == EFX_FILTER_RX_DMAQ_ID_DROP) |
|---|
| 1050 | | - return false; |
|---|
| 1051 | | - |
|---|
| 1052 | | - if (spec->match_flags & |
|---|
| 1053 | | - (EFX_FILTER_MATCH_LOC_MAC | EFX_FILTER_MATCH_LOC_MAC_IG) && |
|---|
| 1054 | | - is_multicast_ether_addr(spec->loc_mac)) |
|---|
| 1055 | | - return true; |
|---|
| 1056 | | - |
|---|
| 1057 | | - if ((spec->match_flags & |
|---|
| 1058 | | - (EFX_FILTER_MATCH_ETHER_TYPE | EFX_FILTER_MATCH_LOC_HOST)) == |
|---|
| 1059 | | - (EFX_FILTER_MATCH_ETHER_TYPE | EFX_FILTER_MATCH_LOC_HOST)) { |
|---|
| 1060 | | - if (spec->ether_type == htons(ETH_P_IP) && |
|---|
| 1061 | | - ipv4_is_multicast(spec->loc_host[0])) |
|---|
| 1062 | | - return true; |
|---|
| 1063 | | - if (spec->ether_type == htons(ETH_P_IPV6) && |
|---|
| 1064 | | - ((const u8 *)spec->loc_host)[0] == 0xff) |
|---|
| 1065 | | - return true; |
|---|
| 1066 | | - } |
|---|
| 1067 | | - |
|---|
| 1068 | | - return false; |
|---|
| 1069 | 411 | } |
|---|