| /* |
| * Copyright(c) 2017 Intel Corporation. |
| * |
| * This file is provided under a dual BSD/GPLv2 license. When using or |
| * redistributing this file, you may do so under either license. |
| * |
| * GPL LICENSE SUMMARY |
| * |
| * This program is free software; you can redistribute it and/or modify |
| * it under the terms of version 2 of the GNU General Public License as |
| * published by the Free Software Foundation. |
| * |
| * This program is distributed in the hope that it will be useful, but |
| * WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| * General Public License for more details. |
| * |
| * BSD LICENSE |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions |
| * are met: |
| * |
| * - Redistributions of source code must retain the above copyright |
| * notice, this list of conditions and the following disclaimer. |
| * - Redistributions in binary form must reproduce the above copyright |
| * notice, this list of conditions and the following disclaimer in |
| * the documentation and/or other materials provided with the |
| * distribution. |
| * - Neither the name of Intel Corporation nor the names of its |
| * contributors may be used to endorse or promote products derived |
| * from this software without specific prior written permission. |
| * |
| * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
| * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
| * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| * |
| */ |
| |
| /* |
| * This file contains HFI1 support for VNIC functionality |
| */ |
| |
| #include <linux/io.h> |
| #include <linux/if_vlan.h> |
| |
| #include "vnic.h" |
| |
| #define HFI_TX_TIMEOUT_MS 1000 |
| |
| #define HFI1_VNIC_RCV_Q_SIZE 1024 |
| |
| #define HFI1_VNIC_UP 0 |
| |
| static DEFINE_SPINLOCK(vport_cntr_lock); |
| |
| static int setup_vnic_ctxt(struct hfi1_devdata *dd, struct hfi1_ctxtdata *uctxt) |
| { |
| unsigned int rcvctrl_ops = 0; |
| int ret; |
| |
| hfi1_init_ctxt(uctxt->sc); |
| |
| uctxt->do_interrupt = &handle_receive_interrupt; |
| |
| /* Now allocate the RcvHdr queue and eager buffers. */ |
| ret = hfi1_create_rcvhdrq(dd, uctxt); |
| if (ret) |
| goto done; |
| |
| ret = hfi1_setup_eagerbufs(uctxt); |
| if (ret) |
| goto done; |
| |
| if (uctxt->rcvhdrtail_kvaddr) |
| clear_rcvhdrtail(uctxt); |
| |
| rcvctrl_ops = HFI1_RCVCTRL_CTXT_ENB; |
| rcvctrl_ops |= HFI1_RCVCTRL_INTRAVAIL_ENB; |
| |
| if (!HFI1_CAP_KGET_MASK(uctxt->flags, MULTI_PKT_EGR)) |
| rcvctrl_ops |= HFI1_RCVCTRL_ONE_PKT_EGR_ENB; |
| if (HFI1_CAP_KGET_MASK(uctxt->flags, NODROP_EGR_FULL)) |
| rcvctrl_ops |= HFI1_RCVCTRL_NO_EGR_DROP_ENB; |
| if (HFI1_CAP_KGET_MASK(uctxt->flags, NODROP_RHQ_FULL)) |
| rcvctrl_ops |= HFI1_RCVCTRL_NO_RHQ_DROP_ENB; |
| if (HFI1_CAP_KGET_MASK(uctxt->flags, DMA_RTAIL)) |
| rcvctrl_ops |= HFI1_RCVCTRL_TAILUPD_ENB; |
| |
| hfi1_rcvctrl(uctxt->dd, rcvctrl_ops, uctxt); |
| |
| uctxt->is_vnic = true; |
| done: |
| return ret; |
| } |
| |
| static int allocate_vnic_ctxt(struct hfi1_devdata *dd, |
| struct hfi1_ctxtdata **vnic_ctxt) |
| { |
| struct hfi1_ctxtdata *uctxt; |
| int ret; |
| |
| if (dd->flags & HFI1_FROZEN) |
| return -EIO; |
| |
| ret = hfi1_create_ctxtdata(dd->pport, dd->node, &uctxt); |
| if (ret < 0) { |
| dd_dev_err(dd, "Unable to create ctxtdata, failing open\n"); |
| return -ENOMEM; |
| } |
| |
| uctxt->flags = HFI1_CAP_KGET(MULTI_PKT_EGR) | |
| HFI1_CAP_KGET(NODROP_RHQ_FULL) | |
| HFI1_CAP_KGET(NODROP_EGR_FULL) | |
| HFI1_CAP_KGET(DMA_RTAIL); |
| uctxt->seq_cnt = 1; |
| |
| /* Allocate and enable a PIO send context */ |
| uctxt->sc = sc_alloc(dd, SC_VNIC, uctxt->rcvhdrqentsize, |
| uctxt->numa_id); |
| |
| ret = uctxt->sc ? 0 : -ENOMEM; |
| if (ret) |
| goto bail; |
| |
| dd_dev_dbg(dd, "allocated vnic send context %u(%u)\n", |
| uctxt->sc->sw_index, uctxt->sc->hw_context); |
| ret = sc_enable(uctxt->sc); |
| if (ret) |
| goto bail; |
| |
| if (dd->num_msix_entries) |
| hfi1_set_vnic_msix_info(uctxt); |
| |
| hfi1_stats.sps_ctxts++; |
| dd_dev_dbg(dd, "created vnic context %d\n", uctxt->ctxt); |
| *vnic_ctxt = uctxt; |
| |
| return ret; |
| bail: |
| hfi1_free_ctxt(uctxt); |
| dd_dev_dbg(dd, "vnic allocation failed. rc %d\n", ret); |
| return ret; |
| } |
| |
| static void deallocate_vnic_ctxt(struct hfi1_devdata *dd, |
| struct hfi1_ctxtdata *uctxt) |
| { |
| dd_dev_dbg(dd, "closing vnic context %d\n", uctxt->ctxt); |
| flush_wc(); |
| |
| if (dd->num_msix_entries) |
| hfi1_reset_vnic_msix_info(uctxt); |
| |
| /* |
| * Disable receive context and interrupt available, reset all |
| * RcvCtxtCtrl bits to default values. |
| */ |
| hfi1_rcvctrl(dd, HFI1_RCVCTRL_CTXT_DIS | |
| HFI1_RCVCTRL_TIDFLOW_DIS | |
| HFI1_RCVCTRL_INTRAVAIL_DIS | |
| HFI1_RCVCTRL_ONE_PKT_EGR_DIS | |
| HFI1_RCVCTRL_NO_RHQ_DROP_DIS | |
| HFI1_RCVCTRL_NO_EGR_DROP_DIS, uctxt); |
| /* |
| * VNIC contexts are allocated from user context pool. |
| * Release them back to user context pool. |
| * |
| * Reset context integrity checks to default. |
| * (writes to CSRs probably belong in chip.c) |
| */ |
| write_kctxt_csr(dd, uctxt->sc->hw_context, SEND_CTXT_CHECK_ENABLE, |
| hfi1_pkt_default_send_ctxt_mask(dd, SC_USER)); |
| sc_disable(uctxt->sc); |
| |
| dd->send_contexts[uctxt->sc->sw_index].type = SC_USER; |
| |
| uctxt->event_flags = 0; |
| |
| hfi1_clear_tids(uctxt); |
| hfi1_clear_ctxt_pkey(dd, uctxt); |
| |
| hfi1_stats.sps_ctxts--; |
| |
| hfi1_free_ctxt(uctxt); |
| } |
| |
| void hfi1_vnic_setup(struct hfi1_devdata *dd) |
| { |
| idr_init(&dd->vnic.vesw_idr); |
| } |
| |
| void hfi1_vnic_cleanup(struct hfi1_devdata *dd) |
| { |
| idr_destroy(&dd->vnic.vesw_idr); |
| } |
| |
| #define SUM_GRP_COUNTERS(stats, qstats, x_grp) do { \ |
| u64 *src64, *dst64; \ |
| for (src64 = &qstats->x_grp.unicast, \ |
| dst64 = &stats->x_grp.unicast; \ |
| dst64 <= &stats->x_grp.s_1519_max;) { \ |
| *dst64++ += *src64++; \ |
| } \ |
| } while (0) |
| |
| /* hfi1_vnic_update_stats - update statistics */ |
| static void hfi1_vnic_update_stats(struct hfi1_vnic_vport_info *vinfo, |
| struct opa_vnic_stats *stats) |
| { |
| struct net_device *netdev = vinfo->netdev; |
| u8 i; |
| |
| /* add tx counters on different queues */ |
| for (i = 0; i < vinfo->num_tx_q; i++) { |
| struct opa_vnic_stats *qstats = &vinfo->stats[i]; |
| struct rtnl_link_stats64 *qnstats = &vinfo->stats[i].netstats; |
| |
| stats->netstats.tx_fifo_errors += qnstats->tx_fifo_errors; |
| stats->netstats.tx_carrier_errors += qnstats->tx_carrier_errors; |
| stats->tx_drop_state += qstats->tx_drop_state; |
| stats->tx_dlid_zero += qstats->tx_dlid_zero; |
| |
| SUM_GRP_COUNTERS(stats, qstats, tx_grp); |
| stats->netstats.tx_packets += qnstats->tx_packets; |
| stats->netstats.tx_bytes += qnstats->tx_bytes; |
| } |
| |
| /* add rx counters on different queues */ |
| for (i = 0; i < vinfo->num_rx_q; i++) { |
| struct opa_vnic_stats *qstats = &vinfo->stats[i]; |
| struct rtnl_link_stats64 *qnstats = &vinfo->stats[i].netstats; |
| |
| stats->netstats.rx_fifo_errors += qnstats->rx_fifo_errors; |
| stats->netstats.rx_nohandler += qnstats->rx_nohandler; |
| stats->rx_drop_state += qstats->rx_drop_state; |
| stats->rx_oversize += qstats->rx_oversize; |
| stats->rx_runt += qstats->rx_runt; |
| |
| SUM_GRP_COUNTERS(stats, qstats, rx_grp); |
| stats->netstats.rx_packets += qnstats->rx_packets; |
| stats->netstats.rx_bytes += qnstats->rx_bytes; |
| } |
| |
| stats->netstats.tx_errors = stats->netstats.tx_fifo_errors + |
| stats->netstats.tx_carrier_errors + |
| stats->tx_drop_state + stats->tx_dlid_zero; |
| stats->netstats.tx_dropped = stats->netstats.tx_errors; |
| |
| stats->netstats.rx_errors = stats->netstats.rx_fifo_errors + |
| stats->netstats.rx_nohandler + |
| stats->rx_drop_state + stats->rx_oversize + |
| stats->rx_runt; |
| stats->netstats.rx_dropped = stats->netstats.rx_errors; |
| |
| netdev->stats.tx_packets = stats->netstats.tx_packets; |
| netdev->stats.tx_bytes = stats->netstats.tx_bytes; |
| netdev->stats.tx_fifo_errors = stats->netstats.tx_fifo_errors; |
| netdev->stats.tx_carrier_errors = stats->netstats.tx_carrier_errors; |
| netdev->stats.tx_errors = stats->netstats.tx_errors; |
| netdev->stats.tx_dropped = stats->netstats.tx_dropped; |
| |
| netdev->stats.rx_packets = stats->netstats.rx_packets; |
| netdev->stats.rx_bytes = stats->netstats.rx_bytes; |
| netdev->stats.rx_fifo_errors = stats->netstats.rx_fifo_errors; |
| netdev->stats.multicast = stats->rx_grp.mcastbcast; |
| netdev->stats.rx_length_errors = stats->rx_oversize + stats->rx_runt; |
| netdev->stats.rx_errors = stats->netstats.rx_errors; |
| netdev->stats.rx_dropped = stats->netstats.rx_dropped; |
| } |
| |
| /* update_len_counters - update pkt's len histogram counters */ |
| static inline void update_len_counters(struct opa_vnic_grp_stats *grp, |
| int len) |
| { |
| /* account for 4 byte FCS */ |
| if (len >= 1515) |
| grp->s_1519_max++; |
| else if (len >= 1020) |
| grp->s_1024_1518++; |
| else if (len >= 508) |
| grp->s_512_1023++; |
| else if (len >= 252) |
| grp->s_256_511++; |
| else if (len >= 124) |
| grp->s_128_255++; |
| else if (len >= 61) |
| grp->s_65_127++; |
| else |
| grp->s_64++; |
| } |
| |
| /* hfi1_vnic_update_tx_counters - update transmit counters */ |
| static void hfi1_vnic_update_tx_counters(struct hfi1_vnic_vport_info *vinfo, |
| u8 q_idx, struct sk_buff *skb, int err) |
| { |
| struct ethhdr *mac_hdr = (struct ethhdr *)skb_mac_header(skb); |
| struct opa_vnic_stats *stats = &vinfo->stats[q_idx]; |
| struct opa_vnic_grp_stats *tx_grp = &stats->tx_grp; |
| u16 vlan_tci; |
| |
| stats->netstats.tx_packets++; |
| stats->netstats.tx_bytes += skb->len + ETH_FCS_LEN; |
| |
| update_len_counters(tx_grp, skb->len); |
| |
| /* rest of the counts are for good packets only */ |
| if (unlikely(err)) |
| return; |
| |
| if (is_multicast_ether_addr(mac_hdr->h_dest)) |
| tx_grp->mcastbcast++; |
| else |
| tx_grp->unicast++; |
| |
| if (!__vlan_get_tag(skb, &vlan_tci)) |
| tx_grp->vlan++; |
| else |
| tx_grp->untagged++; |
| } |
| |
| /* hfi1_vnic_update_rx_counters - update receive counters */ |
| static void hfi1_vnic_update_rx_counters(struct hfi1_vnic_vport_info *vinfo, |
| u8 q_idx, struct sk_buff *skb, int err) |
| { |
| struct ethhdr *mac_hdr = (struct ethhdr *)skb->data; |
| struct opa_vnic_stats *stats = &vinfo->stats[q_idx]; |
| struct opa_vnic_grp_stats *rx_grp = &stats->rx_grp; |
| u16 vlan_tci; |
| |
| stats->netstats.rx_packets++; |
| stats->netstats.rx_bytes += skb->len + ETH_FCS_LEN; |
| |
| update_len_counters(rx_grp, skb->len); |
| |
| /* rest of the counts are for good packets only */ |
| if (unlikely(err)) |
| return; |
| |
| if (is_multicast_ether_addr(mac_hdr->h_dest)) |
| rx_grp->mcastbcast++; |
| else |
| rx_grp->unicast++; |
| |
| if (!__vlan_get_tag(skb, &vlan_tci)) |
| rx_grp->vlan++; |
| else |
| rx_grp->untagged++; |
| } |
| |
| /* This function is overloaded for opa_vnic specific implementation */ |
| static void hfi1_vnic_get_stats64(struct net_device *netdev, |
| struct rtnl_link_stats64 *stats) |
| { |
| struct opa_vnic_stats *vstats = (struct opa_vnic_stats *)stats; |
| struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev); |
| |
| hfi1_vnic_update_stats(vinfo, vstats); |
| } |
| |
| static u64 create_bypass_pbc(u32 vl, u32 dw_len) |
| { |
| u64 pbc; |
| |
| pbc = ((u64)PBC_IHCRC_NONE << PBC_INSERT_HCRC_SHIFT) |
| | PBC_INSERT_BYPASS_ICRC | PBC_CREDIT_RETURN |
| | PBC_PACKET_BYPASS |
| | ((vl & PBC_VL_MASK) << PBC_VL_SHIFT) |
| | (dw_len & PBC_LENGTH_DWS_MASK) << PBC_LENGTH_DWS_SHIFT; |
| |
| return pbc; |
| } |
| |
| /* hfi1_vnic_maybe_stop_tx - stop tx queue if required */ |
| static void hfi1_vnic_maybe_stop_tx(struct hfi1_vnic_vport_info *vinfo, |
| u8 q_idx) |
| { |
| netif_stop_subqueue(vinfo->netdev, q_idx); |
| if (!hfi1_vnic_sdma_write_avail(vinfo, q_idx)) |
| return; |
| |
| netif_start_subqueue(vinfo->netdev, q_idx); |
| } |
| |
| static netdev_tx_t hfi1_netdev_start_xmit(struct sk_buff *skb, |
| struct net_device *netdev) |
| { |
| struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev); |
| u8 pad_len, q_idx = skb->queue_mapping; |
| struct hfi1_devdata *dd = vinfo->dd; |
| struct opa_vnic_skb_mdata *mdata; |
| u32 pkt_len, total_len; |
| int err = -EINVAL; |
| u64 pbc; |
| |
| v_dbg("xmit: queue %d skb len %d\n", q_idx, skb->len); |
| if (unlikely(!netif_oper_up(netdev))) { |
| vinfo->stats[q_idx].tx_drop_state++; |
| goto tx_finish; |
| } |
| |
| /* take out meta data */ |
| mdata = (struct opa_vnic_skb_mdata *)skb->data; |
| skb_pull(skb, sizeof(*mdata)); |
| if (unlikely(mdata->flags & OPA_VNIC_SKB_MDATA_ENCAP_ERR)) { |
| vinfo->stats[q_idx].tx_dlid_zero++; |
| goto tx_finish; |
| } |
| |
| /* add tail padding (for 8 bytes size alignment) and icrc */ |
| pad_len = -(skb->len + OPA_VNIC_ICRC_TAIL_LEN) & 0x7; |
| pad_len += OPA_VNIC_ICRC_TAIL_LEN; |
| |
| /* |
| * pkt_len is how much data we have to write, includes header and data. |
| * total_len is length of the packet in Dwords plus the PBC should not |
| * include the CRC. |
| */ |
| pkt_len = (skb->len + pad_len) >> 2; |
| total_len = pkt_len + 2; /* PBC + packet */ |
| |
| pbc = create_bypass_pbc(mdata->vl, total_len); |
| |
| skb_get(skb); |
| v_dbg("pbc 0x%016llX len %d pad_len %d\n", pbc, skb->len, pad_len); |
| err = dd->process_vnic_dma_send(dd, q_idx, vinfo, skb, pbc, pad_len); |
| if (unlikely(err)) { |
| if (err == -ENOMEM) |
| vinfo->stats[q_idx].netstats.tx_fifo_errors++; |
| else if (err != -EBUSY) |
| vinfo->stats[q_idx].netstats.tx_carrier_errors++; |
| } |
| /* remove the header before updating tx counters */ |
| skb_pull(skb, OPA_VNIC_HDR_LEN); |
| |
| if (unlikely(err == -EBUSY)) { |
| hfi1_vnic_maybe_stop_tx(vinfo, q_idx); |
| dev_kfree_skb_any(skb); |
| return NETDEV_TX_BUSY; |
| } |
| |
| tx_finish: |
| /* update tx counters */ |
| hfi1_vnic_update_tx_counters(vinfo, q_idx, skb, err); |
| dev_kfree_skb_any(skb); |
| return NETDEV_TX_OK; |
| } |
| |
| static u16 hfi1_vnic_select_queue(struct net_device *netdev, |
| struct sk_buff *skb, |
| void *accel_priv, |
| select_queue_fallback_t fallback) |
| { |
| struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev); |
| struct opa_vnic_skb_mdata *mdata; |
| struct sdma_engine *sde; |
| |
| mdata = (struct opa_vnic_skb_mdata *)skb->data; |
| sde = sdma_select_engine_vl(vinfo->dd, mdata->entropy, mdata->vl); |
| return sde->this_idx; |
| } |
| |
| /* hfi1_vnic_decap_skb - strip OPA header from the skb (ethernet) packet */ |
| static inline int hfi1_vnic_decap_skb(struct hfi1_vnic_rx_queue *rxq, |
| struct sk_buff *skb) |
| { |
| struct hfi1_vnic_vport_info *vinfo = rxq->vinfo; |
| int max_len = vinfo->netdev->mtu + VLAN_ETH_HLEN; |
| int rc = -EFAULT; |
| |
| skb_pull(skb, OPA_VNIC_HDR_LEN); |
| |
| /* Validate Packet length */ |
| if (unlikely(skb->len > max_len)) |
| vinfo->stats[rxq->idx].rx_oversize++; |
| else if (unlikely(skb->len < ETH_ZLEN)) |
| vinfo->stats[rxq->idx].rx_runt++; |
| else |
| rc = 0; |
| return rc; |
| } |
| |
| static inline struct sk_buff *hfi1_vnic_get_skb(struct hfi1_vnic_rx_queue *rxq) |
| { |
| unsigned char *pad_info; |
| struct sk_buff *skb; |
| |
| skb = skb_dequeue(&rxq->skbq); |
| if (unlikely(!skb)) |
| return NULL; |
| |
| /* remove tail padding and icrc */ |
| pad_info = skb->data + skb->len - 1; |
| skb_trim(skb, (skb->len - OPA_VNIC_ICRC_TAIL_LEN - |
| ((*pad_info) & 0x7))); |
| |
| return skb; |
| } |
| |
| /* hfi1_vnic_handle_rx - handle skb receive */ |
| static void hfi1_vnic_handle_rx(struct hfi1_vnic_rx_queue *rxq, |
| int *work_done, int work_to_do) |
| { |
| struct hfi1_vnic_vport_info *vinfo = rxq->vinfo; |
| struct sk_buff *skb; |
| int rc; |
| |
| while (1) { |
| if (*work_done >= work_to_do) |
| break; |
| |
| skb = hfi1_vnic_get_skb(rxq); |
| if (unlikely(!skb)) |
| break; |
| |
| rc = hfi1_vnic_decap_skb(rxq, skb); |
| /* update rx counters */ |
| hfi1_vnic_update_rx_counters(vinfo, rxq->idx, skb, rc); |
| if (unlikely(rc)) { |
| dev_kfree_skb_any(skb); |
| continue; |
| } |
| |
| skb_checksum_none_assert(skb); |
| skb->protocol = eth_type_trans(skb, rxq->netdev); |
| |
| napi_gro_receive(&rxq->napi, skb); |
| (*work_done)++; |
| } |
| } |
| |
| /* hfi1_vnic_napi - napi receive polling callback function */ |
| static int hfi1_vnic_napi(struct napi_struct *napi, int budget) |
| { |
| struct hfi1_vnic_rx_queue *rxq = container_of(napi, |
| struct hfi1_vnic_rx_queue, napi); |
| struct hfi1_vnic_vport_info *vinfo = rxq->vinfo; |
| int work_done = 0; |
| |
| v_dbg("napi %d budget %d\n", rxq->idx, budget); |
| hfi1_vnic_handle_rx(rxq, &work_done, budget); |
| |
| v_dbg("napi %d work_done %d\n", rxq->idx, work_done); |
| if (work_done < budget) |
| napi_complete(napi); |
| |
| return work_done; |
| } |
| |
| void hfi1_vnic_bypass_rcv(struct hfi1_packet *packet) |
| { |
| struct hfi1_devdata *dd = packet->rcd->dd; |
| struct hfi1_vnic_vport_info *vinfo = NULL; |
| struct hfi1_vnic_rx_queue *rxq; |
| struct sk_buff *skb; |
| int l4_type, vesw_id = -1; |
| u8 q_idx; |
| |
| l4_type = hfi1_16B_get_l4(packet->ebuf); |
| if (likely(l4_type == OPA_16B_L4_ETHR)) { |
| vesw_id = HFI1_VNIC_GET_VESWID(packet->ebuf); |
| vinfo = idr_find(&dd->vnic.vesw_idr, vesw_id); |
| |
| /* |
| * In case of invalid vesw id, count the error on |
| * the first available vport. |
| */ |
| if (unlikely(!vinfo)) { |
| struct hfi1_vnic_vport_info *vinfo_tmp; |
| int id_tmp = 0; |
| |
| vinfo_tmp = idr_get_next(&dd->vnic.vesw_idr, &id_tmp); |
| if (vinfo_tmp) { |
| spin_lock(&vport_cntr_lock); |
| vinfo_tmp->stats[0].netstats.rx_nohandler++; |
| spin_unlock(&vport_cntr_lock); |
| } |
| } |
| } |
| |
| if (unlikely(!vinfo)) { |
| dd_dev_warn(dd, "vnic rcv err: l4 %d vesw id %d ctx %d\n", |
| l4_type, vesw_id, packet->rcd->ctxt); |
| return; |
| } |
| |
| q_idx = packet->rcd->vnic_q_idx; |
| rxq = &vinfo->rxq[q_idx]; |
| if (unlikely(!netif_oper_up(vinfo->netdev))) { |
| vinfo->stats[q_idx].rx_drop_state++; |
| skb_queue_purge(&rxq->skbq); |
| return; |
| } |
| |
| if (unlikely(skb_queue_len(&rxq->skbq) > HFI1_VNIC_RCV_Q_SIZE)) { |
| vinfo->stats[q_idx].netstats.rx_fifo_errors++; |
| return; |
| } |
| |
| skb = netdev_alloc_skb(vinfo->netdev, packet->tlen); |
| if (unlikely(!skb)) { |
| vinfo->stats[q_idx].netstats.rx_fifo_errors++; |
| return; |
| } |
| |
| memcpy(skb->data, packet->ebuf, packet->tlen); |
| skb_put(skb, packet->tlen); |
| skb_queue_tail(&rxq->skbq, skb); |
| |
| if (napi_schedule_prep(&rxq->napi)) { |
| v_dbg("napi %d scheduling\n", q_idx); |
| __napi_schedule(&rxq->napi); |
| } |
| } |
| |
| static int hfi1_vnic_up(struct hfi1_vnic_vport_info *vinfo) |
| { |
| struct hfi1_devdata *dd = vinfo->dd; |
| struct net_device *netdev = vinfo->netdev; |
| int i, rc; |
| |
| /* ensure virtual eth switch id is valid */ |
| if (!vinfo->vesw_id) |
| return -EINVAL; |
| |
| rc = idr_alloc(&dd->vnic.vesw_idr, vinfo, vinfo->vesw_id, |
| vinfo->vesw_id + 1, GFP_NOWAIT); |
| if (rc < 0) |
| return rc; |
| |
| for (i = 0; i < vinfo->num_rx_q; i++) { |
| struct hfi1_vnic_rx_queue *rxq = &vinfo->rxq[i]; |
| |
| skb_queue_head_init(&rxq->skbq); |
| napi_enable(&rxq->napi); |
| } |
| |
| netif_carrier_on(netdev); |
| netif_tx_start_all_queues(netdev); |
| set_bit(HFI1_VNIC_UP, &vinfo->flags); |
| |
| return 0; |
| } |
| |
| static void hfi1_vnic_down(struct hfi1_vnic_vport_info *vinfo) |
| { |
| struct hfi1_devdata *dd = vinfo->dd; |
| u8 i; |
| |
| clear_bit(HFI1_VNIC_UP, &vinfo->flags); |
| netif_carrier_off(vinfo->netdev); |
| netif_tx_disable(vinfo->netdev); |
| idr_remove(&dd->vnic.vesw_idr, vinfo->vesw_id); |
| |
| /* ensure irqs see the change */ |
| hfi1_vnic_synchronize_irq(dd); |
| |
| /* remove unread skbs */ |
| for (i = 0; i < vinfo->num_rx_q; i++) { |
| struct hfi1_vnic_rx_queue *rxq = &vinfo->rxq[i]; |
| |
| napi_disable(&rxq->napi); |
| skb_queue_purge(&rxq->skbq); |
| } |
| } |
| |
| static int hfi1_netdev_open(struct net_device *netdev) |
| { |
| struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev); |
| int rc; |
| |
| mutex_lock(&vinfo->lock); |
| rc = hfi1_vnic_up(vinfo); |
| mutex_unlock(&vinfo->lock); |
| return rc; |
| } |
| |
| static int hfi1_netdev_close(struct net_device *netdev) |
| { |
| struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev); |
| |
| mutex_lock(&vinfo->lock); |
| if (test_bit(HFI1_VNIC_UP, &vinfo->flags)) |
| hfi1_vnic_down(vinfo); |
| mutex_unlock(&vinfo->lock); |
| return 0; |
| } |
| |
| static int hfi1_vnic_allot_ctxt(struct hfi1_devdata *dd, |
| struct hfi1_ctxtdata **vnic_ctxt) |
| { |
| int rc; |
| |
| rc = allocate_vnic_ctxt(dd, vnic_ctxt); |
| if (rc) { |
| dd_dev_err(dd, "vnic ctxt alloc failed %d\n", rc); |
| return rc; |
| } |
| |
| rc = setup_vnic_ctxt(dd, *vnic_ctxt); |
| if (rc) { |
| dd_dev_err(dd, "vnic ctxt setup failed %d\n", rc); |
| deallocate_vnic_ctxt(dd, *vnic_ctxt); |
| *vnic_ctxt = NULL; |
| } |
| |
| return rc; |
| } |
| |
| static int hfi1_vnic_init(struct hfi1_vnic_vport_info *vinfo) |
| { |
| struct hfi1_devdata *dd = vinfo->dd; |
| int i, rc = 0; |
| |
| mutex_lock(&hfi1_mutex); |
| if (!dd->vnic.num_vports) { |
| rc = hfi1_vnic_txreq_init(dd); |
| if (rc) |
| goto txreq_fail; |
| |
| dd->vnic.msix_idx = dd->first_dyn_msix_idx; |
| } |
| |
| for (i = dd->vnic.num_ctxt; i < vinfo->num_rx_q; i++) { |
| rc = hfi1_vnic_allot_ctxt(dd, &dd->vnic.ctxt[i]); |
| if (rc) |
| break; |
| hfi1_rcd_get(dd->vnic.ctxt[i]); |
| dd->vnic.ctxt[i]->vnic_q_idx = i; |
| } |
| |
| if (i < vinfo->num_rx_q) { |
| /* |
| * If required amount of contexts is not |
| * allocated successfully then remaining contexts |
| * are released. |
| */ |
| while (i-- > dd->vnic.num_ctxt) { |
| deallocate_vnic_ctxt(dd, dd->vnic.ctxt[i]); |
| hfi1_rcd_put(dd->vnic.ctxt[i]); |
| dd->vnic.ctxt[i] = NULL; |
| } |
| goto alloc_fail; |
| } |
| |
| if (dd->vnic.num_ctxt != i) { |
| dd->vnic.num_ctxt = i; |
| hfi1_init_vnic_rsm(dd); |
| } |
| |
| dd->vnic.num_vports++; |
| hfi1_vnic_sdma_init(vinfo); |
| alloc_fail: |
| if (!dd->vnic.num_vports) |
| hfi1_vnic_txreq_deinit(dd); |
| txreq_fail: |
| mutex_unlock(&hfi1_mutex); |
| return rc; |
| } |
| |
| static void hfi1_vnic_deinit(struct hfi1_vnic_vport_info *vinfo) |
| { |
| struct hfi1_devdata *dd = vinfo->dd; |
| int i; |
| |
| mutex_lock(&hfi1_mutex); |
| if (--dd->vnic.num_vports == 0) { |
| for (i = 0; i < dd->vnic.num_ctxt; i++) { |
| deallocate_vnic_ctxt(dd, dd->vnic.ctxt[i]); |
| hfi1_rcd_put(dd->vnic.ctxt[i]); |
| dd->vnic.ctxt[i] = NULL; |
| } |
| hfi1_deinit_vnic_rsm(dd); |
| dd->vnic.num_ctxt = 0; |
| hfi1_vnic_txreq_deinit(dd); |
| } |
| mutex_unlock(&hfi1_mutex); |
| } |
| |
| static void hfi1_vnic_set_vesw_id(struct net_device *netdev, int id) |
| { |
| struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev); |
| bool reopen = false; |
| |
| /* |
| * If vesw_id is being changed, and if the vnic port is up, |
| * reset the vnic port to ensure new vesw_id gets picked up |
| */ |
| if (id != vinfo->vesw_id) { |
| mutex_lock(&vinfo->lock); |
| if (test_bit(HFI1_VNIC_UP, &vinfo->flags)) { |
| hfi1_vnic_down(vinfo); |
| reopen = true; |
| } |
| |
| vinfo->vesw_id = id; |
| if (reopen) |
| hfi1_vnic_up(vinfo); |
| |
| mutex_unlock(&vinfo->lock); |
| } |
| } |
| |
| /* netdev ops */ |
| static const struct net_device_ops hfi1_netdev_ops = { |
| .ndo_open = hfi1_netdev_open, |
| .ndo_stop = hfi1_netdev_close, |
| .ndo_start_xmit = hfi1_netdev_start_xmit, |
| .ndo_select_queue = hfi1_vnic_select_queue, |
| .ndo_get_stats64 = hfi1_vnic_get_stats64, |
| }; |
| |
| static void hfi1_vnic_free_rn(struct net_device *netdev) |
| { |
| struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev); |
| |
| hfi1_vnic_deinit(vinfo); |
| mutex_destroy(&vinfo->lock); |
| free_netdev(netdev); |
| } |
| |
| struct net_device *hfi1_vnic_alloc_rn(struct ib_device *device, |
| u8 port_num, |
| enum rdma_netdev_t type, |
| const char *name, |
| unsigned char name_assign_type, |
| void (*setup)(struct net_device *)) |
| { |
| struct hfi1_devdata *dd = dd_from_ibdev(device); |
| struct hfi1_vnic_vport_info *vinfo; |
| struct net_device *netdev; |
| struct rdma_netdev *rn; |
| int i, size, rc; |
| |
| if (!dd->num_vnic_contexts) |
| return ERR_PTR(-ENOMEM); |
| |
| if (!port_num || (port_num > dd->num_pports)) |
| return ERR_PTR(-EINVAL); |
| |
| if (type != RDMA_NETDEV_OPA_VNIC) |
| return ERR_PTR(-EOPNOTSUPP); |
| |
| size = sizeof(struct opa_vnic_rdma_netdev) + sizeof(*vinfo); |
| netdev = alloc_netdev_mqs(size, name, name_assign_type, setup, |
| dd->chip_sdma_engines, dd->num_vnic_contexts); |
| if (!netdev) |
| return ERR_PTR(-ENOMEM); |
| |
| rn = netdev_priv(netdev); |
| vinfo = opa_vnic_dev_priv(netdev); |
| vinfo->dd = dd; |
| vinfo->num_tx_q = dd->chip_sdma_engines; |
| vinfo->num_rx_q = dd->num_vnic_contexts; |
| vinfo->netdev = netdev; |
| rn->free_rdma_netdev = hfi1_vnic_free_rn; |
| rn->set_id = hfi1_vnic_set_vesw_id; |
| |
| netdev->features = NETIF_F_HIGHDMA | NETIF_F_SG; |
| netdev->hw_features = netdev->features; |
| netdev->vlan_features = netdev->features; |
| netdev->watchdog_timeo = msecs_to_jiffies(HFI_TX_TIMEOUT_MS); |
| netdev->netdev_ops = &hfi1_netdev_ops; |
| mutex_init(&vinfo->lock); |
| |
| for (i = 0; i < vinfo->num_rx_q; i++) { |
| struct hfi1_vnic_rx_queue *rxq = &vinfo->rxq[i]; |
| |
| rxq->idx = i; |
| rxq->vinfo = vinfo; |
| rxq->netdev = netdev; |
| netif_napi_add(netdev, &rxq->napi, hfi1_vnic_napi, 64); |
| } |
| |
| rc = hfi1_vnic_init(vinfo); |
| if (rc) |
| goto init_fail; |
| |
| return netdev; |
| init_fail: |
| mutex_destroy(&vinfo->lock); |
| free_netdev(netdev); |
| return ERR_PTR(rc); |
| } |