123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858 |
- /*
- * Copyright(c) 2017 - 2018 Intel Corporation.
- *
- * This file is provided under a dual BSD/GPLv2 license. When using or
- * redistributing this file, you may do so under either license.
- *
- * GPL LICENSE SUMMARY
- *
- * This program is free software; you can redistribute it and/or modify
- * it under the terms of version 2 of the GNU General Public License as
- * published by the Free Software Foundation.
- *
- * This program is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- * General Public License for more details.
- *
- * BSD LICENSE
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * - Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- * - Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- * - Neither the name of Intel Corporation nor the names of its
- * contributors may be used to endorse or promote products derived
- * from this software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
- * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
- * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
- * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
- * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- */
- /*
- * This file contains HFI1 support for VNIC functionality
- */
- #include <linux/io.h>
- #include <linux/if_vlan.h>
- #include "vnic.h"
- #define HFI_TX_TIMEOUT_MS 1000
- #define HFI1_VNIC_RCV_Q_SIZE 1024
- #define HFI1_VNIC_UP 0
- static DEFINE_SPINLOCK(vport_cntr_lock);
- static int setup_vnic_ctxt(struct hfi1_devdata *dd, struct hfi1_ctxtdata *uctxt)
- {
- unsigned int rcvctrl_ops = 0;
- int ret;
- uctxt->do_interrupt = &handle_receive_interrupt;
- /* Now allocate the RcvHdr queue and eager buffers. */
- ret = hfi1_create_rcvhdrq(dd, uctxt);
- if (ret)
- goto done;
- ret = hfi1_setup_eagerbufs(uctxt);
- if (ret)
- goto done;
- if (uctxt->rcvhdrtail_kvaddr)
- clear_rcvhdrtail(uctxt);
- rcvctrl_ops = HFI1_RCVCTRL_CTXT_ENB;
- rcvctrl_ops |= HFI1_RCVCTRL_INTRAVAIL_ENB;
- if (!HFI1_CAP_KGET_MASK(uctxt->flags, MULTI_PKT_EGR))
- rcvctrl_ops |= HFI1_RCVCTRL_ONE_PKT_EGR_ENB;
- if (HFI1_CAP_KGET_MASK(uctxt->flags, NODROP_EGR_FULL))
- rcvctrl_ops |= HFI1_RCVCTRL_NO_EGR_DROP_ENB;
- if (HFI1_CAP_KGET_MASK(uctxt->flags, NODROP_RHQ_FULL))
- rcvctrl_ops |= HFI1_RCVCTRL_NO_RHQ_DROP_ENB;
- if (HFI1_CAP_KGET_MASK(uctxt->flags, DMA_RTAIL))
- rcvctrl_ops |= HFI1_RCVCTRL_TAILUPD_ENB;
- hfi1_rcvctrl(uctxt->dd, rcvctrl_ops, uctxt);
- done:
- return ret;
- }
- static int allocate_vnic_ctxt(struct hfi1_devdata *dd,
- struct hfi1_ctxtdata **vnic_ctxt)
- {
- struct hfi1_ctxtdata *uctxt;
- int ret;
- if (dd->flags & HFI1_FROZEN)
- return -EIO;
- ret = hfi1_create_ctxtdata(dd->pport, dd->node, &uctxt);
- if (ret < 0) {
- dd_dev_err(dd, "Unable to create ctxtdata, failing open\n");
- return -ENOMEM;
- }
- uctxt->flags = HFI1_CAP_KGET(MULTI_PKT_EGR) |
- HFI1_CAP_KGET(NODROP_RHQ_FULL) |
- HFI1_CAP_KGET(NODROP_EGR_FULL) |
- HFI1_CAP_KGET(DMA_RTAIL);
- uctxt->seq_cnt = 1;
- uctxt->is_vnic = true;
- hfi1_set_vnic_msix_info(uctxt);
- hfi1_stats.sps_ctxts++;
- dd_dev_dbg(dd, "created vnic context %d\n", uctxt->ctxt);
- *vnic_ctxt = uctxt;
- return 0;
- }
- static void deallocate_vnic_ctxt(struct hfi1_devdata *dd,
- struct hfi1_ctxtdata *uctxt)
- {
- dd_dev_dbg(dd, "closing vnic context %d\n", uctxt->ctxt);
- flush_wc();
- hfi1_reset_vnic_msix_info(uctxt);
- /*
- * Disable receive context and interrupt available, reset all
- * RcvCtxtCtrl bits to default values.
- */
- hfi1_rcvctrl(dd, HFI1_RCVCTRL_CTXT_DIS |
- HFI1_RCVCTRL_TIDFLOW_DIS |
- HFI1_RCVCTRL_INTRAVAIL_DIS |
- HFI1_RCVCTRL_ONE_PKT_EGR_DIS |
- HFI1_RCVCTRL_NO_RHQ_DROP_DIS |
- HFI1_RCVCTRL_NO_EGR_DROP_DIS, uctxt);
- uctxt->event_flags = 0;
- hfi1_clear_tids(uctxt);
- hfi1_clear_ctxt_pkey(dd, uctxt);
- hfi1_stats.sps_ctxts--;
- hfi1_free_ctxt(uctxt);
- }
- void hfi1_vnic_setup(struct hfi1_devdata *dd)
- {
- idr_init(&dd->vnic.vesw_idr);
- }
- void hfi1_vnic_cleanup(struct hfi1_devdata *dd)
- {
- idr_destroy(&dd->vnic.vesw_idr);
- }
- #define SUM_GRP_COUNTERS(stats, qstats, x_grp) do { \
- u64 *src64, *dst64; \
- for (src64 = &qstats->x_grp.unicast, \
- dst64 = &stats->x_grp.unicast; \
- dst64 <= &stats->x_grp.s_1519_max;) { \
- *dst64++ += *src64++; \
- } \
- } while (0)
- /* hfi1_vnic_update_stats - update statistics */
- static void hfi1_vnic_update_stats(struct hfi1_vnic_vport_info *vinfo,
- struct opa_vnic_stats *stats)
- {
- struct net_device *netdev = vinfo->netdev;
- u8 i;
- /* add tx counters on different queues */
- for (i = 0; i < vinfo->num_tx_q; i++) {
- struct opa_vnic_stats *qstats = &vinfo->stats[i];
- struct rtnl_link_stats64 *qnstats = &vinfo->stats[i].netstats;
- stats->netstats.tx_fifo_errors += qnstats->tx_fifo_errors;
- stats->netstats.tx_carrier_errors += qnstats->tx_carrier_errors;
- stats->tx_drop_state += qstats->tx_drop_state;
- stats->tx_dlid_zero += qstats->tx_dlid_zero;
- SUM_GRP_COUNTERS(stats, qstats, tx_grp);
- stats->netstats.tx_packets += qnstats->tx_packets;
- stats->netstats.tx_bytes += qnstats->tx_bytes;
- }
- /* add rx counters on different queues */
- for (i = 0; i < vinfo->num_rx_q; i++) {
- struct opa_vnic_stats *qstats = &vinfo->stats[i];
- struct rtnl_link_stats64 *qnstats = &vinfo->stats[i].netstats;
- stats->netstats.rx_fifo_errors += qnstats->rx_fifo_errors;
- stats->netstats.rx_nohandler += qnstats->rx_nohandler;
- stats->rx_drop_state += qstats->rx_drop_state;
- stats->rx_oversize += qstats->rx_oversize;
- stats->rx_runt += qstats->rx_runt;
- SUM_GRP_COUNTERS(stats, qstats, rx_grp);
- stats->netstats.rx_packets += qnstats->rx_packets;
- stats->netstats.rx_bytes += qnstats->rx_bytes;
- }
- stats->netstats.tx_errors = stats->netstats.tx_fifo_errors +
- stats->netstats.tx_carrier_errors +
- stats->tx_drop_state + stats->tx_dlid_zero;
- stats->netstats.tx_dropped = stats->netstats.tx_errors;
- stats->netstats.rx_errors = stats->netstats.rx_fifo_errors +
- stats->netstats.rx_nohandler +
- stats->rx_drop_state + stats->rx_oversize +
- stats->rx_runt;
- stats->netstats.rx_dropped = stats->netstats.rx_errors;
- netdev->stats.tx_packets = stats->netstats.tx_packets;
- netdev->stats.tx_bytes = stats->netstats.tx_bytes;
- netdev->stats.tx_fifo_errors = stats->netstats.tx_fifo_errors;
- netdev->stats.tx_carrier_errors = stats->netstats.tx_carrier_errors;
- netdev->stats.tx_errors = stats->netstats.tx_errors;
- netdev->stats.tx_dropped = stats->netstats.tx_dropped;
- netdev->stats.rx_packets = stats->netstats.rx_packets;
- netdev->stats.rx_bytes = stats->netstats.rx_bytes;
- netdev->stats.rx_fifo_errors = stats->netstats.rx_fifo_errors;
- netdev->stats.multicast = stats->rx_grp.mcastbcast;
- netdev->stats.rx_length_errors = stats->rx_oversize + stats->rx_runt;
- netdev->stats.rx_errors = stats->netstats.rx_errors;
- netdev->stats.rx_dropped = stats->netstats.rx_dropped;
- }
- /* update_len_counters - update pkt's len histogram counters */
- static inline void update_len_counters(struct opa_vnic_grp_stats *grp,
- int len)
- {
- /* account for 4 byte FCS */
- if (len >= 1515)
- grp->s_1519_max++;
- else if (len >= 1020)
- grp->s_1024_1518++;
- else if (len >= 508)
- grp->s_512_1023++;
- else if (len >= 252)
- grp->s_256_511++;
- else if (len >= 124)
- grp->s_128_255++;
- else if (len >= 61)
- grp->s_65_127++;
- else
- grp->s_64++;
- }
- /* hfi1_vnic_update_tx_counters - update transmit counters */
- static void hfi1_vnic_update_tx_counters(struct hfi1_vnic_vport_info *vinfo,
- u8 q_idx, struct sk_buff *skb, int err)
- {
- struct ethhdr *mac_hdr = (struct ethhdr *)skb_mac_header(skb);
- struct opa_vnic_stats *stats = &vinfo->stats[q_idx];
- struct opa_vnic_grp_stats *tx_grp = &stats->tx_grp;
- u16 vlan_tci;
- stats->netstats.tx_packets++;
- stats->netstats.tx_bytes += skb->len + ETH_FCS_LEN;
- update_len_counters(tx_grp, skb->len);
- /* rest of the counts are for good packets only */
- if (unlikely(err))
- return;
- if (is_multicast_ether_addr(mac_hdr->h_dest))
- tx_grp->mcastbcast++;
- else
- tx_grp->unicast++;
- if (!__vlan_get_tag(skb, &vlan_tci))
- tx_grp->vlan++;
- else
- tx_grp->untagged++;
- }
- /* hfi1_vnic_update_rx_counters - update receive counters */
- static void hfi1_vnic_update_rx_counters(struct hfi1_vnic_vport_info *vinfo,
- u8 q_idx, struct sk_buff *skb, int err)
- {
- struct ethhdr *mac_hdr = (struct ethhdr *)skb->data;
- struct opa_vnic_stats *stats = &vinfo->stats[q_idx];
- struct opa_vnic_grp_stats *rx_grp = &stats->rx_grp;
- u16 vlan_tci;
- stats->netstats.rx_packets++;
- stats->netstats.rx_bytes += skb->len + ETH_FCS_LEN;
- update_len_counters(rx_grp, skb->len);
- /* rest of the counts are for good packets only */
- if (unlikely(err))
- return;
- if (is_multicast_ether_addr(mac_hdr->h_dest))
- rx_grp->mcastbcast++;
- else
- rx_grp->unicast++;
- if (!__vlan_get_tag(skb, &vlan_tci))
- rx_grp->vlan++;
- else
- rx_grp->untagged++;
- }
- /* This function is overloaded for opa_vnic specific implementation */
- static void hfi1_vnic_get_stats64(struct net_device *netdev,
- struct rtnl_link_stats64 *stats)
- {
- struct opa_vnic_stats *vstats = (struct opa_vnic_stats *)stats;
- struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
- hfi1_vnic_update_stats(vinfo, vstats);
- }
- static u64 create_bypass_pbc(u32 vl, u32 dw_len)
- {
- u64 pbc;
- pbc = ((u64)PBC_IHCRC_NONE << PBC_INSERT_HCRC_SHIFT)
- | PBC_INSERT_BYPASS_ICRC | PBC_CREDIT_RETURN
- | PBC_PACKET_BYPASS
- | ((vl & PBC_VL_MASK) << PBC_VL_SHIFT)
- | (dw_len & PBC_LENGTH_DWS_MASK) << PBC_LENGTH_DWS_SHIFT;
- return pbc;
- }
- /* hfi1_vnic_maybe_stop_tx - stop tx queue if required */
- static void hfi1_vnic_maybe_stop_tx(struct hfi1_vnic_vport_info *vinfo,
- u8 q_idx)
- {
- netif_stop_subqueue(vinfo->netdev, q_idx);
- if (!hfi1_vnic_sdma_write_avail(vinfo, q_idx))
- return;
- netif_start_subqueue(vinfo->netdev, q_idx);
- }
- static netdev_tx_t hfi1_netdev_start_xmit(struct sk_buff *skb,
- struct net_device *netdev)
- {
- struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
- u8 pad_len, q_idx = skb->queue_mapping;
- struct hfi1_devdata *dd = vinfo->dd;
- struct opa_vnic_skb_mdata *mdata;
- u32 pkt_len, total_len;
- int err = -EINVAL;
- u64 pbc;
- v_dbg("xmit: queue %d skb len %d\n", q_idx, skb->len);
- if (unlikely(!netif_oper_up(netdev))) {
- vinfo->stats[q_idx].tx_drop_state++;
- goto tx_finish;
- }
- /* take out meta data */
- mdata = (struct opa_vnic_skb_mdata *)skb->data;
- skb_pull(skb, sizeof(*mdata));
- if (unlikely(mdata->flags & OPA_VNIC_SKB_MDATA_ENCAP_ERR)) {
- vinfo->stats[q_idx].tx_dlid_zero++;
- goto tx_finish;
- }
- /* add tail padding (for 8 bytes size alignment) and icrc */
- pad_len = -(skb->len + OPA_VNIC_ICRC_TAIL_LEN) & 0x7;
- pad_len += OPA_VNIC_ICRC_TAIL_LEN;
- /*
- * pkt_len is how much data we have to write, includes header and data.
- * total_len is length of the packet in Dwords plus the PBC should not
- * include the CRC.
- */
- pkt_len = (skb->len + pad_len) >> 2;
- total_len = pkt_len + 2; /* PBC + packet */
- pbc = create_bypass_pbc(mdata->vl, total_len);
- skb_get(skb);
- v_dbg("pbc 0x%016llX len %d pad_len %d\n", pbc, skb->len, pad_len);
- err = dd->process_vnic_dma_send(dd, q_idx, vinfo, skb, pbc, pad_len);
- if (unlikely(err)) {
- if (err == -ENOMEM)
- vinfo->stats[q_idx].netstats.tx_fifo_errors++;
- else if (err != -EBUSY)
- vinfo->stats[q_idx].netstats.tx_carrier_errors++;
- }
- /* remove the header before updating tx counters */
- skb_pull(skb, OPA_VNIC_HDR_LEN);
- if (unlikely(err == -EBUSY)) {
- hfi1_vnic_maybe_stop_tx(vinfo, q_idx);
- dev_kfree_skb_any(skb);
- return NETDEV_TX_BUSY;
- }
- tx_finish:
- /* update tx counters */
- hfi1_vnic_update_tx_counters(vinfo, q_idx, skb, err);
- dev_kfree_skb_any(skb);
- return NETDEV_TX_OK;
- }
- static u16 hfi1_vnic_select_queue(struct net_device *netdev,
- struct sk_buff *skb,
- struct net_device *sb_dev,
- select_queue_fallback_t fallback)
- {
- struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
- struct opa_vnic_skb_mdata *mdata;
- struct sdma_engine *sde;
- mdata = (struct opa_vnic_skb_mdata *)skb->data;
- sde = sdma_select_engine_vl(vinfo->dd, mdata->entropy, mdata->vl);
- return sde->this_idx;
- }
- /* hfi1_vnic_decap_skb - strip OPA header from the skb (ethernet) packet */
- static inline int hfi1_vnic_decap_skb(struct hfi1_vnic_rx_queue *rxq,
- struct sk_buff *skb)
- {
- struct hfi1_vnic_vport_info *vinfo = rxq->vinfo;
- int max_len = vinfo->netdev->mtu + VLAN_ETH_HLEN;
- int rc = -EFAULT;
- skb_pull(skb, OPA_VNIC_HDR_LEN);
- /* Validate Packet length */
- if (unlikely(skb->len > max_len))
- vinfo->stats[rxq->idx].rx_oversize++;
- else if (unlikely(skb->len < ETH_ZLEN))
- vinfo->stats[rxq->idx].rx_runt++;
- else
- rc = 0;
- return rc;
- }
- static inline struct sk_buff *hfi1_vnic_get_skb(struct hfi1_vnic_rx_queue *rxq)
- {
- unsigned char *pad_info;
- struct sk_buff *skb;
- skb = skb_dequeue(&rxq->skbq);
- if (unlikely(!skb))
- return NULL;
- /* remove tail padding and icrc */
- pad_info = skb->data + skb->len - 1;
- skb_trim(skb, (skb->len - OPA_VNIC_ICRC_TAIL_LEN -
- ((*pad_info) & 0x7)));
- return skb;
- }
- /* hfi1_vnic_handle_rx - handle skb receive */
- static void hfi1_vnic_handle_rx(struct hfi1_vnic_rx_queue *rxq,
- int *work_done, int work_to_do)
- {
- struct hfi1_vnic_vport_info *vinfo = rxq->vinfo;
- struct sk_buff *skb;
- int rc;
- while (1) {
- if (*work_done >= work_to_do)
- break;
- skb = hfi1_vnic_get_skb(rxq);
- if (unlikely(!skb))
- break;
- rc = hfi1_vnic_decap_skb(rxq, skb);
- /* update rx counters */
- hfi1_vnic_update_rx_counters(vinfo, rxq->idx, skb, rc);
- if (unlikely(rc)) {
- dev_kfree_skb_any(skb);
- continue;
- }
- skb_checksum_none_assert(skb);
- skb->protocol = eth_type_trans(skb, rxq->netdev);
- napi_gro_receive(&rxq->napi, skb);
- (*work_done)++;
- }
- }
- /* hfi1_vnic_napi - napi receive polling callback function */
- static int hfi1_vnic_napi(struct napi_struct *napi, int budget)
- {
- struct hfi1_vnic_rx_queue *rxq = container_of(napi,
- struct hfi1_vnic_rx_queue, napi);
- struct hfi1_vnic_vport_info *vinfo = rxq->vinfo;
- int work_done = 0;
- v_dbg("napi %d budget %d\n", rxq->idx, budget);
- hfi1_vnic_handle_rx(rxq, &work_done, budget);
- v_dbg("napi %d work_done %d\n", rxq->idx, work_done);
- if (work_done < budget)
- napi_complete(napi);
- return work_done;
- }
- void hfi1_vnic_bypass_rcv(struct hfi1_packet *packet)
- {
- struct hfi1_devdata *dd = packet->rcd->dd;
- struct hfi1_vnic_vport_info *vinfo = NULL;
- struct hfi1_vnic_rx_queue *rxq;
- struct sk_buff *skb;
- int l4_type, vesw_id = -1;
- u8 q_idx;
- l4_type = hfi1_16B_get_l4(packet->ebuf);
- if (likely(l4_type == OPA_16B_L4_ETHR)) {
- vesw_id = HFI1_VNIC_GET_VESWID(packet->ebuf);
- vinfo = idr_find(&dd->vnic.vesw_idr, vesw_id);
- /*
- * In case of invalid vesw id, count the error on
- * the first available vport.
- */
- if (unlikely(!vinfo)) {
- struct hfi1_vnic_vport_info *vinfo_tmp;
- int id_tmp = 0;
- vinfo_tmp = idr_get_next(&dd->vnic.vesw_idr, &id_tmp);
- if (vinfo_tmp) {
- spin_lock(&vport_cntr_lock);
- vinfo_tmp->stats[0].netstats.rx_nohandler++;
- spin_unlock(&vport_cntr_lock);
- }
- }
- }
- if (unlikely(!vinfo)) {
- dd_dev_warn(dd, "vnic rcv err: l4 %d vesw id %d ctx %d\n",
- l4_type, vesw_id, packet->rcd->ctxt);
- return;
- }
- q_idx = packet->rcd->vnic_q_idx;
- rxq = &vinfo->rxq[q_idx];
- if (unlikely(!netif_oper_up(vinfo->netdev))) {
- vinfo->stats[q_idx].rx_drop_state++;
- skb_queue_purge(&rxq->skbq);
- return;
- }
- if (unlikely(skb_queue_len(&rxq->skbq) > HFI1_VNIC_RCV_Q_SIZE)) {
- vinfo->stats[q_idx].netstats.rx_fifo_errors++;
- return;
- }
- skb = netdev_alloc_skb(vinfo->netdev, packet->tlen);
- if (unlikely(!skb)) {
- vinfo->stats[q_idx].netstats.rx_fifo_errors++;
- return;
- }
- memcpy(skb->data, packet->ebuf, packet->tlen);
- skb_put(skb, packet->tlen);
- skb_queue_tail(&rxq->skbq, skb);
- if (napi_schedule_prep(&rxq->napi)) {
- v_dbg("napi %d scheduling\n", q_idx);
- __napi_schedule(&rxq->napi);
- }
- }
- static int hfi1_vnic_up(struct hfi1_vnic_vport_info *vinfo)
- {
- struct hfi1_devdata *dd = vinfo->dd;
- struct net_device *netdev = vinfo->netdev;
- int i, rc;
- /* ensure virtual eth switch id is valid */
- if (!vinfo->vesw_id)
- return -EINVAL;
- rc = idr_alloc(&dd->vnic.vesw_idr, vinfo, vinfo->vesw_id,
- vinfo->vesw_id + 1, GFP_NOWAIT);
- if (rc < 0)
- return rc;
- for (i = 0; i < vinfo->num_rx_q; i++) {
- struct hfi1_vnic_rx_queue *rxq = &vinfo->rxq[i];
- skb_queue_head_init(&rxq->skbq);
- napi_enable(&rxq->napi);
- }
- netif_carrier_on(netdev);
- netif_tx_start_all_queues(netdev);
- set_bit(HFI1_VNIC_UP, &vinfo->flags);
- return 0;
- }
- static void hfi1_vnic_down(struct hfi1_vnic_vport_info *vinfo)
- {
- struct hfi1_devdata *dd = vinfo->dd;
- u8 i;
- clear_bit(HFI1_VNIC_UP, &vinfo->flags);
- netif_carrier_off(vinfo->netdev);
- netif_tx_disable(vinfo->netdev);
- idr_remove(&dd->vnic.vesw_idr, vinfo->vesw_id);
- /* ensure irqs see the change */
- hfi1_vnic_synchronize_irq(dd);
- /* remove unread skbs */
- for (i = 0; i < vinfo->num_rx_q; i++) {
- struct hfi1_vnic_rx_queue *rxq = &vinfo->rxq[i];
- napi_disable(&rxq->napi);
- skb_queue_purge(&rxq->skbq);
- }
- }
- static int hfi1_netdev_open(struct net_device *netdev)
- {
- struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
- int rc;
- mutex_lock(&vinfo->lock);
- rc = hfi1_vnic_up(vinfo);
- mutex_unlock(&vinfo->lock);
- return rc;
- }
- static int hfi1_netdev_close(struct net_device *netdev)
- {
- struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
- mutex_lock(&vinfo->lock);
- if (test_bit(HFI1_VNIC_UP, &vinfo->flags))
- hfi1_vnic_down(vinfo);
- mutex_unlock(&vinfo->lock);
- return 0;
- }
- static int hfi1_vnic_allot_ctxt(struct hfi1_devdata *dd,
- struct hfi1_ctxtdata **vnic_ctxt)
- {
- int rc;
- rc = allocate_vnic_ctxt(dd, vnic_ctxt);
- if (rc) {
- dd_dev_err(dd, "vnic ctxt alloc failed %d\n", rc);
- return rc;
- }
- rc = setup_vnic_ctxt(dd, *vnic_ctxt);
- if (rc) {
- dd_dev_err(dd, "vnic ctxt setup failed %d\n", rc);
- deallocate_vnic_ctxt(dd, *vnic_ctxt);
- *vnic_ctxt = NULL;
- }
- return rc;
- }
- static int hfi1_vnic_init(struct hfi1_vnic_vport_info *vinfo)
- {
- struct hfi1_devdata *dd = vinfo->dd;
- int i, rc = 0;
- mutex_lock(&hfi1_mutex);
- if (!dd->vnic.num_vports) {
- rc = hfi1_vnic_txreq_init(dd);
- if (rc)
- goto txreq_fail;
- dd->vnic.msix_idx = dd->first_dyn_msix_idx;
- }
- for (i = dd->vnic.num_ctxt; i < vinfo->num_rx_q; i++) {
- rc = hfi1_vnic_allot_ctxt(dd, &dd->vnic.ctxt[i]);
- if (rc)
- break;
- hfi1_rcd_get(dd->vnic.ctxt[i]);
- dd->vnic.ctxt[i]->vnic_q_idx = i;
- }
- if (i < vinfo->num_rx_q) {
- /*
- * If required amount of contexts is not
- * allocated successfully then remaining contexts
- * are released.
- */
- while (i-- > dd->vnic.num_ctxt) {
- deallocate_vnic_ctxt(dd, dd->vnic.ctxt[i]);
- hfi1_rcd_put(dd->vnic.ctxt[i]);
- dd->vnic.ctxt[i] = NULL;
- }
- goto alloc_fail;
- }
- if (dd->vnic.num_ctxt != i) {
- dd->vnic.num_ctxt = i;
- hfi1_init_vnic_rsm(dd);
- }
- dd->vnic.num_vports++;
- hfi1_vnic_sdma_init(vinfo);
- alloc_fail:
- if (!dd->vnic.num_vports)
- hfi1_vnic_txreq_deinit(dd);
- txreq_fail:
- mutex_unlock(&hfi1_mutex);
- return rc;
- }
- static void hfi1_vnic_deinit(struct hfi1_vnic_vport_info *vinfo)
- {
- struct hfi1_devdata *dd = vinfo->dd;
- int i;
- mutex_lock(&hfi1_mutex);
- if (--dd->vnic.num_vports == 0) {
- for (i = 0; i < dd->vnic.num_ctxt; i++) {
- deallocate_vnic_ctxt(dd, dd->vnic.ctxt[i]);
- hfi1_rcd_put(dd->vnic.ctxt[i]);
- dd->vnic.ctxt[i] = NULL;
- }
- hfi1_deinit_vnic_rsm(dd);
- dd->vnic.num_ctxt = 0;
- hfi1_vnic_txreq_deinit(dd);
- }
- mutex_unlock(&hfi1_mutex);
- }
- static void hfi1_vnic_set_vesw_id(struct net_device *netdev, int id)
- {
- struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
- bool reopen = false;
- /*
- * If vesw_id is being changed, and if the vnic port is up,
- * reset the vnic port to ensure new vesw_id gets picked up
- */
- if (id != vinfo->vesw_id) {
- mutex_lock(&vinfo->lock);
- if (test_bit(HFI1_VNIC_UP, &vinfo->flags)) {
- hfi1_vnic_down(vinfo);
- reopen = true;
- }
- vinfo->vesw_id = id;
- if (reopen)
- hfi1_vnic_up(vinfo);
- mutex_unlock(&vinfo->lock);
- }
- }
- /* netdev ops */
- static const struct net_device_ops hfi1_netdev_ops = {
- .ndo_open = hfi1_netdev_open,
- .ndo_stop = hfi1_netdev_close,
- .ndo_start_xmit = hfi1_netdev_start_xmit,
- .ndo_select_queue = hfi1_vnic_select_queue,
- .ndo_get_stats64 = hfi1_vnic_get_stats64,
- };
- static void hfi1_vnic_free_rn(struct net_device *netdev)
- {
- struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
- hfi1_vnic_deinit(vinfo);
- mutex_destroy(&vinfo->lock);
- free_netdev(netdev);
- }
- struct net_device *hfi1_vnic_alloc_rn(struct ib_device *device,
- u8 port_num,
- enum rdma_netdev_t type,
- const char *name,
- unsigned char name_assign_type,
- void (*setup)(struct net_device *))
- {
- struct hfi1_devdata *dd = dd_from_ibdev(device);
- struct hfi1_vnic_vport_info *vinfo;
- struct net_device *netdev;
- struct rdma_netdev *rn;
- int i, size, rc;
- if (!dd->num_vnic_contexts)
- return ERR_PTR(-ENOMEM);
- if (!port_num || (port_num > dd->num_pports))
- return ERR_PTR(-EINVAL);
- if (type != RDMA_NETDEV_OPA_VNIC)
- return ERR_PTR(-EOPNOTSUPP);
- size = sizeof(struct opa_vnic_rdma_netdev) + sizeof(*vinfo);
- netdev = alloc_netdev_mqs(size, name, name_assign_type, setup,
- chip_sdma_engines(dd), dd->num_vnic_contexts);
- if (!netdev)
- return ERR_PTR(-ENOMEM);
- rn = netdev_priv(netdev);
- vinfo = opa_vnic_dev_priv(netdev);
- vinfo->dd = dd;
- vinfo->num_tx_q = chip_sdma_engines(dd);
- vinfo->num_rx_q = dd->num_vnic_contexts;
- vinfo->netdev = netdev;
- rn->free_rdma_netdev = hfi1_vnic_free_rn;
- rn->set_id = hfi1_vnic_set_vesw_id;
- netdev->features = NETIF_F_HIGHDMA | NETIF_F_SG;
- netdev->hw_features = netdev->features;
- netdev->vlan_features = netdev->features;
- netdev->watchdog_timeo = msecs_to_jiffies(HFI_TX_TIMEOUT_MS);
- netdev->netdev_ops = &hfi1_netdev_ops;
- mutex_init(&vinfo->lock);
- for (i = 0; i < vinfo->num_rx_q; i++) {
- struct hfi1_vnic_rx_queue *rxq = &vinfo->rxq[i];
- rxq->idx = i;
- rxq->vinfo = vinfo;
- rxq->netdev = netdev;
- netif_napi_add(netdev, &rxq->napi, hfi1_vnic_napi, 64);
- }
- rc = hfi1_vnic_init(vinfo);
- if (rc)
- goto init_fail;
- return netdev;
- init_fail:
- mutex_destroy(&vinfo->lock);
- free_netdev(netdev);
- return ERR_PTR(rc);
- }
|