summaryrefslogtreecommitdiffstats
path: root/sys/pci/if_ste.c
diff options
context:
space:
mode:
authorambrisko <ambrisko@FreeBSD.org>2002-08-07 22:31:27 +0000
committerambrisko <ambrisko@FreeBSD.org>2002-08-07 22:31:27 +0000
commit50ff7d43747a1dd2374b40b3ceb1fa3b7d3299cd (patch)
tree501f988d59778f5ebf95773846f122b048aed007 /sys/pci/if_ste.c
parent0516dc643cb4cc01ddf0939879e53f7aca690bcf (diff)
downloadFreeBSD-src-50ff7d43747a1dd2374b40b3ceb1fa3b7d3299cd.zip
FreeBSD-src-50ff7d43747a1dd2374b40b3ceb1fa3b7d3299cd.tar.gz
Fixes for the D-Link DFE-580 card.
This pretty much fixes every issue I can find: - Watchdog timeouts were due to starting the TX DMA engine before we had a packet ready for it. So the first packet sent never got out; only if we sent more than one packet at a time did the others make it out and not blow up. Of course, resetting the chip then caused us not to transmit the first packet again, i.e. a catch-22. This required logic changes. - Combine interrupts on TX packets being queued up. - Don't keep running around the RX ring, since we might get out of sync; only go around once per receive. - Let the RX engine recover via the poll interface, which is similar to the TX interface. This way the chip wakes up with no effort when we read enough packets. - Do better hand-shaking on RX & TX packets so they don't start off too soon. - Force a duplex setting when the link comes up after an ste_init, or it will default to half-duplex and be really slow. This only happens on subsequent ste_init calls; the first one worked. - Don't call stat_update for every overflow. We only monitor the collisions, so the tick interval is good enough for that. Just read in the collision stats to minimize bus reads. - Don't read the miibus every tick, since it uses delays and delays are not good for performance. - Tie link events directly to the miibus code so the port gets set correctly if someone changes the port settings. - Reduce the extreme number of {R,T}FD's. They would consume 130K of kernel memory for each NIC. - Set the TX_THRESH to wait for the DMA engine to complete before running the TX FIFO. This hurts peak TX performance, but under bi-directional load the DMA engine can't keep up with the FIFO. Testing shows that we end up in that case anyway (a la dc(4) issues, but worse since the RX engine hogs everything). - When stopping the card, do a reset, since the reset verifies the card has stopped. Otherwise, on heavy RX load the RX DMA engine is still stuffing packets into memory. 
If that happens after we free the DMA area memory, bits get scribbled in memory and bad things happen. This card still has seemingly unfixable issues under heavy RX load in which the card takes over the PCI bus. Sponsored by: Vernier Networks MFC after: 1 week
Diffstat (limited to 'sys/pci/if_ste.c')
-rw-r--r--sys/pci/if_ste.c172
1 files changed, 96 insertions, 76 deletions
diff --git a/sys/pci/if_ste.c b/sys/pci/if_ste.c
index 6b65dcf..73f218c 100644
--- a/sys/pci/if_ste.c
+++ b/sys/pci/if_ste.c
@@ -45,6 +45,7 @@
#include <net/ethernet.h>
#include <net/if_dl.h>
#include <net/if_media.h>
+#include <net/if_vlan_var.h>
#include <net/bpf.h>
@@ -643,6 +644,10 @@ static void ste_intr(xsc)
ste_stats_update(sc);
}
+ if (status & STE_ISR_LINKEVENT)
+ mii_pollstat(device_get_softc(sc->ste_miibus));
+
+
if (status & STE_ISR_HOSTERR) {
ste_reset(sc);
ste_init(sc);
@@ -671,14 +676,17 @@ static void ste_rxeof(sc)
struct mbuf *m;
struct ifnet *ifp;
struct ste_chain_onefrag *cur_rx;
- int total_len = 0;
+ int total_len = 0, count=0;
u_int32_t rxstat;
ifp = &sc->arpcom.ac_if;
-again:
+ while((rxstat = sc->ste_cdata.ste_rx_head->ste_ptr->ste_status)
+ & STE_RXSTAT_DMADONE) {
+ if ((STE_RX_LIST_CNT - count) < 3) {
+ break;
+ }
- while((rxstat = sc->ste_cdata.ste_rx_head->ste_ptr->ste_status)) {
cur_rx = sc->ste_cdata.ste_rx_head;
sc->ste_cdata.ste_rx_head = cur_rx->ste_next;
@@ -732,29 +740,9 @@ again:
/* Remove header from mbuf and pass it on. */
m_adj(m, sizeof(struct ether_header));
ether_input(ifp, eh, m);
- }
- /*
- * Handle the 'end of channel' condition. When the upload
- * engine hits the end of the RX ring, it will stall. This
- * is our cue to flush the RX ring, reload the uplist pointer
- * register and unstall the engine.
- * XXX This is actually a little goofy. With the ThunderLAN
- * chip, you get an interrupt when the receiver hits the end
- * of the receive ring, which tells you exactly when you
- * you need to reload the ring pointer. Here we have to
- * fake it. I'm mad at myself for not being clever enough
- * to avoid the use of a goto here.
- */
- if (CSR_READ_4(sc, STE_RX_DMALIST_PTR) == 0 ||
- CSR_READ_4(sc, STE_DMACTL) & STE_DMACTL_RXDMA_STOPPED) {
- STE_SETBIT4(sc, STE_DMACTL, STE_DMACTL_RXDMA_STALL);
- ste_wait(sc);
- CSR_WRITE_4(sc, STE_RX_DMALIST_PTR,
- vtophys(&sc->ste_ldata->ste_rx_list[0]));
- sc->ste_cdata.ste_rx_head = &sc->ste_cdata.ste_rx_chain[0];
- STE_SETBIT4(sc, STE_DMACTL, STE_DMACTL_RXDMA_UNSTALL);
- goto again;
+ cur_rx->ste_ptr->ste_status = 0;
+ count++;
}
return;
@@ -838,11 +826,8 @@ static void ste_stats_update(xsc)
void *xsc;
{
struct ste_softc *sc;
- struct ste_stats stats;
struct ifnet *ifp;
struct mii_data *mii;
- int i;
- u_int8_t *p;
sc = xsc;
STE_LOCK(sc);
@@ -850,22 +835,23 @@ static void ste_stats_update(xsc)
ifp = &sc->arpcom.ac_if;
mii = device_get_softc(sc->ste_miibus);
- p = (u_int8_t *)&stats;
+ ifp->if_collisions += CSR_READ_1(sc, STE_LATE_COLLS)
+ + CSR_READ_1(sc, STE_MULTI_COLLS)
+ + CSR_READ_1(sc, STE_SINGLE_COLLS);
- for (i = 0; i < sizeof(stats); i++) {
- *p = CSR_READ_1(sc, STE_STATS + i);
- p++;
- }
-
- ifp->if_collisions += stats.ste_single_colls +
- stats.ste_multi_colls + stats.ste_late_colls;
-
- mii_tick(mii);
- if (!sc->ste_link && mii->mii_media_status & IFM_ACTIVE &&
- IFM_SUBTYPE(mii->mii_media_active) != IFM_NONE) {
- sc->ste_link++;
- if (ifp->if_snd.ifq_head != NULL)
- ste_start(ifp);
+ if (!sc->ste_link) {
+ mii_pollstat(mii);
+ if (mii->mii_media_status & IFM_ACTIVE &&
+ IFM_SUBTYPE(mii->mii_media_active) != IFM_NONE) {
+ sc->ste_link++;
+ /*
+ * we don't get a call-back on re-init so do it
+ * otherwise we get stuck in the wrong link state
+ */
+ ste_miibus_statchg(sc->ste_dev);
+ if (ifp->if_snd.ifq_head != NULL)
+ ste_start(ifp);
+ }
}
sc->ste_stat_ch = timeout(ste_stats_update, sc, hz);
@@ -913,6 +899,7 @@ static int ste_attach(dev)
sc = device_get_softc(dev);
unit = device_get_unit(dev);
bzero(sc, sizeof(struct ste_softc));
+ sc->ste_dev = dev;
mtx_init(&sc->ste_mtx, device_get_nameunit(dev), MTX_NETWORK_LOCK,
MTX_DEF | MTX_RECURSE);
@@ -1065,10 +1052,18 @@ static int ste_attach(dev)
ifp->if_baudrate = 10000000;
ifp->if_snd.ifq_maxlen = STE_TX_LIST_CNT - 1;
+ sc->ste_tx_thresh = STE_TXSTART_THRESH;
+
/*
* Call MI attach routine.
*/
ether_ifattach(ifp, ETHER_BPF_SUPPORTED);
+
+ /*
+ * Tell the upper layer(s) we support long frames.
+ */
+ ifp->if_data.ifi_hdrlen = sizeof(struct ether_vlan_header);
+
STE_UNLOCK(sc);
return(0);
@@ -1134,7 +1129,7 @@ static int ste_newbuf(sc, c, m)
c->ste_mbuf = m_new;
c->ste_ptr->ste_status = 0;
c->ste_ptr->ste_frag.ste_addr = vtophys(mtod(m_new, caddr_t));
- c->ste_ptr->ste_frag.ste_len = 1536 | STE_FRAG_LAST;
+ c->ste_ptr->ste_frag.ste_len = (1536 + EVL_ENCAPLEN) | STE_FRAG_LAST;
return(0);
}
@@ -1164,7 +1159,7 @@ static int ste_init_rx_list(sc)
ld->ste_rx_list[i].ste_next =
vtophys(&ld->ste_rx_list[i + 1]);
}
-
+ ld->ste_rx_list[i].ste_status = 0;
}
cd->ste_rx_head = &cd->ste_rx_chain[0];
@@ -1183,6 +1178,8 @@ static void ste_init_tx_list(sc)
ld = sc->ste_ldata;
for (i = 0; i < STE_TX_LIST_CNT; i++) {
cd->ste_tx_chain[i].ste_ptr = &ld->ste_tx_list[i];
+ cd->ste_tx_chain[i].ste_ptr->ste_next = 0;
+ cd->ste_tx_chain[i].ste_ptr->ste_ctl = 0;
cd->ste_tx_chain[i].ste_phys = vtophys(&ld->ste_tx_list[i]);
if (i == (STE_TX_LIST_CNT - 1))
cd->ste_tx_chain[i].ste_next =
@@ -1198,10 +1195,6 @@ static void ste_init_tx_list(sc)
&cd->ste_tx_chain[i - 1];
}
-
- bzero((char *)ld->ste_tx_list,
- sizeof(struct ste_desc) * STE_TX_LIST_CNT);
-
cd->ste_tx_prod = 0;
cd->ste_tx_cons = 0;
cd->ste_tx_cnt = 0;
@@ -1238,6 +1231,9 @@ static void ste_init(xsc)
return;
}
+ /* Set RX polling interval */
+ CSR_WRITE_1(sc, STE_RX_DMAPOLL_PERIOD, 1);
+
/* Init TX descriptors */
ste_init_tx_list(sc);
@@ -1277,20 +1273,21 @@ static void ste_init(xsc)
STE_SETBIT4(sc, STE_DMACTL, STE_DMACTL_RXDMA_UNSTALL);
STE_SETBIT4(sc, STE_DMACTL, STE_DMACTL_RXDMA_UNSTALL);
- /* Set TX polling interval */
- CSR_WRITE_1(sc, STE_TX_DMAPOLL_PERIOD, 64);
+ /* Set TX polling interval (defer until we TX first packet */
+ CSR_WRITE_1(sc, STE_TX_DMAPOLL_PERIOD, 0);
/* Load address of the TX list */
STE_SETBIT4(sc, STE_DMACTL, STE_DMACTL_TXDMA_STALL);
ste_wait(sc);
- CSR_WRITE_4(sc, STE_TX_DMALIST_PTR,
- vtophys(&sc->ste_ldata->ste_tx_list[0]));
+ CSR_WRITE_4(sc, STE_TX_DMALIST_PTR, 0);
STE_SETBIT4(sc, STE_DMACTL, STE_DMACTL_TXDMA_UNSTALL);
STE_SETBIT4(sc, STE_DMACTL, STE_DMACTL_TXDMA_UNSTALL);
ste_wait(sc);
+ sc->ste_tx_prev_idx=-1;
/* Enable receiver and transmitter */
CSR_WRITE_2(sc, STE_MACCTL0, 0);
+ CSR_WRITE_2(sc, STE_MACCTL1, 0);
STE_SETBIT2(sc, STE_MACCTL1, STE_MACCTL1_TX_ENABLE);
STE_SETBIT2(sc, STE_MACCTL1, STE_MACCTL1_RX_ENABLE);
@@ -1301,6 +1298,9 @@ static void ste_init(xsc)
CSR_WRITE_2(sc, STE_ISR, 0xFFFF);
CSR_WRITE_2(sc, STE_IMR, STE_INTRS);
+ /* Accept VLAN length packets */
+ CSR_WRITE_2(sc, STE_MAX_FRAMELEN, ETHER_MAX_LEN + EVL_ENCAPLEN);
+
ste_ifmedia_upd(ifp);
ifp->if_flags |= IFF_RUNNING;
@@ -1330,6 +1330,11 @@ static void ste_stop(sc)
STE_SETBIT2(sc, STE_DMACTL, STE_DMACTL_TXDMA_STALL);
STE_SETBIT2(sc, STE_DMACTL, STE_DMACTL_RXDMA_STALL);
ste_wait(sc);
+ /*
+ * Try really hard to stop the RX engine or under heavy RX
+ * data chip will write into de-allocated memory.
+ */
+ ste_reset(sc);
sc->ste_link = 0;
@@ -1347,6 +1352,8 @@ static void ste_stop(sc)
}
}
+ bzero(sc->ste_ldata, sizeof(struct ste_list_data));
+
ifp->if_flags &= ~(IFF_RUNNING|IFF_OACTIVE);
STE_UNLOCK(sc);
@@ -1410,8 +1417,10 @@ static int ste_ioctl(ifp, command, data)
sc->ste_if_flags & IFF_PROMISC) {
STE_CLRBIT1(sc, STE_RX_MODE,
STE_RXMODE_PROMISC);
- } else if (!(ifp->if_flags & IFF_RUNNING)) {
- sc->ste_tx_thresh = STE_MIN_FRAMELEN;
+ }
+ if (!(ifp->if_flags & IFF_RUNNING)) {
+ sc->ste_tx_thresh = STE_MIN_FRAMELEN * 2;
+ sc->ste_tx_thresh = STE_TXSTART_THRESH;
ste_init(sc);
}
} else {
@@ -1454,14 +1463,13 @@ static int ste_encap(sc, c, m_head)
d = c->ste_ptr;
d->ste_ctl = 0;
- d->ste_next = 0;
for (m = m_head, frag = 0; m != NULL; m = m->m_next) {
if (m->m_len != 0) {
if (frag == STE_MAXFRAGS)
break;
total_len += m->m_len;
- f = &c->ste_ptr->ste_frags[frag];
+ f = &d->ste_frags[frag];
f->ste_addr = vtophys(mtod(m, vm_offset_t));
f->ste_len = m->m_len;
frag++;
@@ -1469,8 +1477,8 @@ static int ste_encap(sc, c, m_head)
}
c->ste_mbuf = m_head;
- c->ste_ptr->ste_frags[frag - 1].ste_len |= STE_FRAG_LAST;
- c->ste_ptr->ste_ctl = total_len;
+ d->ste_frags[frag - 1].ste_len |= STE_FRAG_LAST;
+ d->ste_ctl = 1;
return(0);
}
@@ -1480,7 +1488,7 @@ static void ste_start(ifp)
{
struct ste_softc *sc;
struct mbuf *m_head = NULL;
- struct ste_chain *prev = NULL, *cur_tx = NULL, *start_tx;
+ struct ste_chain *cur_tx = NULL;
int idx;
sc = ifp->if_softc;
@@ -1497,7 +1505,6 @@ static void ste_start(ifp)
}
idx = sc->ste_cdata.ste_tx_prod;
- start_tx = &sc->ste_cdata.ste_tx_chain[idx];
while(sc->ste_cdata.ste_tx_chain[idx].ste_mbuf == NULL) {
@@ -1514,9 +1521,32 @@ static void ste_start(ifp)
ste_encap(sc, cur_tx, m_head);
- if (prev != NULL)
- prev->ste_ptr->ste_next = cur_tx->ste_phys;
- prev = cur_tx;
+ cur_tx->ste_ptr->ste_next = 0;
+
+ if(sc->ste_tx_prev_idx < 0){
+ cur_tx->ste_ptr->ste_ctl = STE_TXCTL_DMAINTR | 1;
+ /* Load address of the TX list */
+ STE_SETBIT4(sc, STE_DMACTL, STE_DMACTL_TXDMA_STALL);
+ ste_wait(sc);
+
+ CSR_WRITE_4(sc, STE_TX_DMALIST_PTR,
+ vtophys(&sc->ste_ldata->ste_tx_list[0]));
+
+ /* Set TX polling interval to start TX engine */
+ CSR_WRITE_1(sc, STE_TX_DMAPOLL_PERIOD, 64);
+
+ STE_SETBIT4(sc, STE_DMACTL, STE_DMACTL_TXDMA_UNSTALL);
+ STE_SETBIT4(sc, STE_DMACTL, STE_DMACTL_TXDMA_UNSTALL);
+ ste_wait(sc);
+
+ }else{
+ cur_tx->ste_ptr->ste_ctl = STE_TXCTL_DMAINTR | 1;
+ sc->ste_cdata.ste_tx_chain[
+ sc->ste_tx_prev_idx].ste_ptr->ste_next
+ = cur_tx->ste_phys;
+ }
+
+ sc->ste_tx_prev_idx=idx;
/*
* If there's a BPF listener, bounce a copy of this frame
@@ -1527,20 +1557,10 @@ static void ste_start(ifp)
STE_INC(idx, STE_TX_LIST_CNT);
sc->ste_cdata.ste_tx_cnt++;
+ ifp->if_timer = 5;
+ sc->ste_cdata.ste_tx_prod = idx;
}
- if (cur_tx == NULL) {
- STE_UNLOCK(sc);
- return;
- }
-
- cur_tx->ste_ptr->ste_ctl |= STE_TXCTL_DMAINTR;
-
- /* Start transmission */
- sc->ste_cdata.ste_tx_prod = idx;
- start_tx->ste_prev->ste_ptr->ste_next = start_tx->ste_phys;
-
- ifp->if_timer = 5;
STE_UNLOCK(sc);
return;
OpenPOWER on IntegriCloud