diff options
author | David Gwynne <dlg@cvs.openbsd.org> | 2020-12-17 04:15:04 +0000 |
---|---|---|
committer | David Gwynne <dlg@cvs.openbsd.org> | 2020-12-17 04:15:04 +0000 |
commit | e4034b0ab677f79f8d83dacb9e0bf49feae9deed (patch) | |
tree | 3da44ebacea08ad31b63413a2b9bf5bd5204b733 /sys/dev/pci | |
parent | 7a639ca841756f33e666fd79d9b0bd2d158528ba (diff) |
rework the maths used to set mbuf timestamps.
there's a comment that explains how it works now, but the result is
that i get much tighter and more consistent synchronisation between
the kernel clock and the values derived from the mcx timestamps
now.
however, i only just worked out that there is still an unresolved
problem where the kernel clock changes how fast it ticks. this
happens when ntpd uses adjtime(2) or adjfreq(2) to try and make the
kernel tick at the same rate as the rest of the universe (well, the
small bit of it that it can observe). these adjustments to the
kernel clock immediately skew the timestamps that mcx calculates,
but then it also throws off the mcx calibration calculations that
run every 30 seconds. the offsets calculated in the next calibration
period are often (very) negative.
eg, when things are synced up nicely and you do a read of the mcx
timer and immediately follow it with a nanouptime(9) call, on this
box it calculates that the time in between those two events is about
2600ns. in the calibration period after ntpd did a very small adjtime
call, it now thinks the time between those two events is -700000ns.
this is a pretty obvious problem in hindsight. i can't think of a
simple solution to it at the moment though so i'm going to leave
mcx timestamping disabled for now.
Diffstat (limited to 'sys/dev/pci')
-rw-r--r-- | sys/dev/pci/if_mcx.c | 39 |
1 files changed, 26 insertions, 13 deletions
diff --git a/sys/dev/pci/if_mcx.c b/sys/dev/pci/if_mcx.c index 30b8927887a..8f33ccd1bbd 100644 --- a/sys/dev/pci/if_mcx.c +++ b/sys/dev/pci/if_mcx.c @@ -1,4 +1,4 @@ -/* $OpenBSD: if_mcx.c,v 1.79 2020/12/15 03:40:29 dlg Exp $ */ +/* $OpenBSD: if_mcx.c,v 1.80 2020/12/17 04:15:03 dlg Exp $ */ /* * Copyright (c) 2017 David Gwynne <dlg@openbsd.org> @@ -2252,12 +2252,11 @@ struct mcx_calibration { uint64_t c_uptime; /* previous kernel nanouptime */ uint64_t c_tbase; /* mcx chip time */ uint64_t c_ubase; /* kernel nanouptime */ - uint64_t c_tdiff; - uint64_t c_udiff; + uint64_t c_ratio; }; #define MCX_CALIBRATE_FIRST 2 -#define MCX_CALIBRATE_NORMAL 30 +#define MCX_CALIBRATE_NORMAL 32 struct mcx_rx { struct mcx_softc *rx_softc; @@ -6599,18 +6598,19 @@ mcx_calibrate_first(struct mcx_softc *sc) c->c_ubase = mcx_uptime(); c->c_tbase = mcx_timer(sc); splx(s); - c->c_tdiff = 0; + c->c_ratio = 0; timeout_add_sec(&sc->sc_calibrate, MCX_CALIBRATE_FIRST); } -#define MCX_TIMESTAMP_SHIFT 10 +#define MCX_TIMESTAMP_SHIFT 24 static void mcx_calibrate(void *arg) { struct mcx_softc *sc = arg; struct mcx_calibration *nc, *pc; + uint64_t udiff, tdiff; unsigned int gen; int s; @@ -6632,8 +6632,19 @@ mcx_calibrate(void *arg) nc->c_tbase = mcx_timer(sc); splx(s); - nc->c_udiff = (nc->c_ubase - nc->c_uptime) >> MCX_TIMESTAMP_SHIFT; - nc->c_tdiff = (nc->c_tbase - nc->c_timestamp) >> MCX_TIMESTAMP_SHIFT; + udiff = nc->c_ubase - nc->c_uptime; + tdiff = nc->c_tbase - nc->c_timestamp; + + /* + * udiff is the wall clock time between calibration ticks, + * which should be 32 seconds or 32 billion nanoseconds. if + * we squint, 1 billion nanoseconds is kind of like a 32 bit + * number, so 32 billion should still have a lot of high bits + * spare. we use this space by shifting the nanoseconds up + * 24 bits so we have a nice big number to divide by the + * number of mcx timer ticks. + */ + nc->c_ratio = (udiff << MCX_TIMESTAMP_SHIFT) / tdiff; membar_producer(); sc->sc_calibration_gen = gen; @@ -6680,12 +6691,14 @@ mcx_process_rx(struct mcx_softc *sc, struct mcx_rx *rx, } #endif - if (ISSET(sc->sc_ac.ac_if.if_flags, IFF_LINK0) && c->c_tdiff) { - uint64_t t = bemtoh64(&cqe->cq_timestamp) - c->c_timestamp; - t *= c->c_udiff; - t /= c->c_tdiff; + if (ISSET(sc->sc_ac.ac_if.if_flags, IFF_LINK0) && c->c_ratio) { + uint64_t t = bemtoh64(&cqe->cq_timestamp); + t -= c->c_timestamp; + t *= c->c_ratio; + t >>= MCX_TIMESTAMP_SHIFT; + t += c->c_uptime; - m->m_pkthdr.ph_timestamp = c->c_uptime + t; + m->m_pkthdr.ph_timestamp = t; SET(m->m_pkthdr.csum_flags, M_TIMESTAMP); } |