> Date: Sun, 6 Nov 2022 19:42:11 +0000 > From: Scott Cheloha <scottchel...@gmail.com> > > This patch switches arm64 to clockintr(9). > > This has survived about a dozen parallel kernel builds, parallel > release builds, and bsd.rd upgrades on my RPi4b. > > kettenis@ said he tried it on one of his M1 machines, too. > > It could use more testing, particularly on arm64 machines that aren't > a Raspberry Pi. > > Notes: > > - The spec is a little unclear about whether or not the > values written to CNTV_TVAL_EL0 are interpretted as signed > or unsigned. To be safe, I have capped the cycle count at > INT32_MAX.
ok kettenis@ > Index: sys/arch/arm64/dev/agtimer.c > =================================================================== > RCS file: /cvs/src/sys/arch/arm64/dev/agtimer.c,v > retrieving revision 1.19 > diff -u -p -r1.19 agtimer.c > --- sys/arch/arm64/dev/agtimer.c 24 Oct 2021 17:52:28 -0000 1.19 > +++ sys/arch/arm64/dev/agtimer.c 6 Nov 2022 18:48:22 -0000 > @@ -18,10 +18,12 @@ > > #include <sys/param.h> > #include <sys/systm.h> > +#include <sys/clockintr.h> > #include <sys/queue.h> > #include <sys/malloc.h> > #include <sys/device.h> > #include <sys/kernel.h> > +#include <sys/stdint.h> > #include <sys/timetc.h> > #include <sys/evcount.h> > > @@ -53,28 +55,13 @@ static struct timecounter agtimer_timeco > .tc_user = TC_AGTIMER, > }; > > -struct agtimer_pcpu_softc { > - uint64_t pc_nexttickevent; > - uint64_t pc_nextstatevent; > - u_int32_t pc_ticks_err_sum; > -}; > - > struct agtimer_softc { > struct device sc_dev; > int sc_node; > > - struct agtimer_pcpu_softc sc_pstat[MAXCPUS]; > - > - u_int32_t sc_ticks_err_cnt; > u_int32_t sc_ticks_per_second; > - u_int32_t sc_ticks_per_intr; > - u_int32_t sc_statvar; > - u_int32_t sc_statmin; > - > -#ifdef AMPTIMER_DEBUG > - struct evcount sc_clk_count; > - struct evcount sc_stat_count; > -#endif > + uint64_t sc_nsec_cycle_ratio; > + uint64_t sc_nsec_max; > void *sc_ih; > }; > > @@ -84,9 +71,11 @@ uint64_t agtimer_readcnt64(void); > int agtimer_intr(void *); > void agtimer_cpu_initclocks(void); > void agtimer_delay(u_int); > +void agtimer_rearm(void *, uint64_t); > void agtimer_setstatclockrate(int stathz); > void agtimer_set_clockrate(int32_t new_frequency); > void agtimer_startclock(void); > +void agtimer_trigger(void *); > > const struct cfattach agtimer_ca = { > sizeof (struct agtimer_softc), agtimer_match, agtimer_attach > @@ -96,6 +85,11 @@ struct cfdriver agtimer_cd = { > NULL, "agtimer", DV_DULL > }; > > +struct intrclock agtimer_intrclock = { > + .ic_rearm = agtimer_rearm, > + .ic_trigger = agtimer_trigger > +}; > + > uint64_t > agtimer_readcnt64(void) > { > @@ -173,13 +167,11 @@ agtimer_attach(struct device *parent, st > agtimer_frequency = > OF_getpropint(sc->sc_node, "clock-frequency", agtimer_frequency); > sc->sc_ticks_per_second = agtimer_frequency; > + sc->sc_nsec_cycle_ratio = > + sc->sc_ticks_per_second * (1ULL << 32) / 1000000000; > + sc->sc_nsec_max = UINT64_MAX / sc->sc_nsec_cycle_ratio; > > - printf(": %d kHz\n", sc->sc_ticks_per_second / 1000); > - > -#ifdef AMPTIMER_DEBUG > - evcount_attach(&sc->sc_clk_count, "clock", NULL); > - evcount_attach(&sc->sc_stat_count, "stat", NULL); > -#endif > + printf(": %u kHz\n", sc->sc_ticks_per_second / 1000); > > /* > * private timer and interrupts not enabled until > @@ -191,8 +183,9 @@ agtimer_attach(struct device *parent, st > > agtimer_timecounter.tc_frequency = sc->sc_ticks_per_second; > agtimer_timecounter.tc_priv = sc; > - > tc_init(&agtimer_timecounter); > + > + agtimer_intrclock.ic_cookie = sc; > } > > u_int > @@ -209,72 +202,30 @@ agtimer_get_timecount(struct timecounter > return (val & 0xffffffff); > } > > -int > -agtimer_intr(void *frame) > +void > +agtimer_rearm(void *cookie, uint64_t nsecs) > { > - struct agtimer_softc *sc = agtimer_cd.cd_devs[0]; > - struct agtimer_pcpu_softc *pc = &sc->sc_pstat[CPU_INFO_UNIT(curcpu())]; > - uint64_t now; > - uint64_t nextevent; > - uint32_t r; > -#if defined(USE_GTIMER_CMP) > - int skip = 1; > -#else > - int64_t delay; > -#endif > - int rc = 0; > - > - /* > - * DSR - I know that the tick timer is 64 bits, but the following > - * code deals with rollover, so there is no point in dealing > - * with the 64 bit math, just let the 32 bit rollover > - * do the right thing > - */ > - > - now = agtimer_readcnt64(); > + struct agtimer_softc *sc = cookie; > + uint32_t cycles; > > - while (pc->pc_nexttickevent <= now) { > - pc->pc_nexttickevent += sc->sc_ticks_per_intr; > - pc->pc_ticks_err_sum += sc->sc_ticks_err_cnt; > - > - /* looping a few times is faster than divide */ > - while (pc->pc_ticks_err_sum > hz) { > - pc->pc_nexttickevent += 1; > - pc->pc_ticks_err_sum -= hz; > - } > - > -#ifdef AMPTIMER_DEBUG > - sc->sc_clk_count.ec_count++; > -#endif > - rc = 1; > - hardclock(frame); > - } > - while (pc->pc_nextstatevent <= now) { > - do { > - r = random() & (sc->sc_statvar -1); > - } while (r == 0); /* random == 0 not allowed */ > - pc->pc_nextstatevent += sc->sc_statmin + r; > - > - /* XXX - correct nextstatevent? */ > -#ifdef AMPTIMER_DEBUG > - sc->sc_stat_count.ec_count++; > -#endif > - rc = 1; > - statclock(frame); > - } > - > - if (pc->pc_nexttickevent < pc->pc_nextstatevent) > - nextevent = pc->pc_nexttickevent; > - else > - nextevent = pc->pc_nextstatevent; > - > - delay = nextevent - now; > - if (delay < 0) > - delay = 1; > + if (nsecs > sc->sc_nsec_max) > + nsecs = sc->sc_nsec_max; > + cycles = (nsecs * sc->sc_nsec_cycle_ratio) >> 32; > + if (cycles > INT32_MAX) > + cycles = INT32_MAX; > + agtimer_set_tval(cycles); > +} > > - agtimer_set_tval(delay); > +void > +agtimer_trigger(void *unused) > +{ > + agtimer_set_tval(0); > +} > > - return (rc); > +int > +agtimer_intr(void *frame) > +{ > + return clockintr_dispatch(frame); > } > > void > @@ -288,8 +239,13 @@ agtimer_set_clockrate(int32_t new_freque > return; > > sc->sc_ticks_per_second = agtimer_frequency; > + sc->sc_nsec_cycle_ratio = > + sc->sc_ticks_per_second * (1ULL << 32) / 1000000000; > + sc->sc_nsec_max = UINT64_MAX / sc->sc_nsec_cycle_ratio; > + > agtimer_timecounter.tc_frequency = sc->sc_ticks_per_second; > - printf("agtimer0: adjusting clock: new tick rate %d kHz\n", > + > + printf("agtimer0: adjusting clock: new tick rate %u kHz\n", > sc->sc_ticks_per_second / 1000); > } > > @@ -297,37 +253,31 @@ void > agtimer_cpu_initclocks(void) > { > struct agtimer_softc *sc = agtimer_cd.cd_devs[0]; > - struct agtimer_pcpu_softc *pc = &sc->sc_pstat[CPU_INFO_UNIT(curcpu())]; > uint32_t reg; > - uint64_t next; > uint64_t kctl; > > stathz = hz; > - profhz = hz * 10; > + profhz = stathz * 10; > + clockintr_init(CL_RNDSTAT); > > if (sc->sc_ticks_per_second != agtimer_frequency) { > agtimer_set_clockrate(agtimer_frequency); > } > > - agtimer_setstatclockrate(stathz); > - > - sc->sc_ticks_per_intr = sc->sc_ticks_per_second / hz; > - sc->sc_ticks_err_cnt = sc->sc_ticks_per_second % hz; > - pc->pc_ticks_err_sum = 0; > - > /* configure virtual timer interrupt */ > sc->sc_ih = arm_intr_establish_fdt_idx(sc->sc_node, 2, > IPL_CLOCK|IPL_MPSAFE, agtimer_intr, NULL, "tick"); > > - next = agtimer_readcnt64() + sc->sc_ticks_per_intr; > - pc->pc_nexttickevent = pc->pc_nextstatevent = next; > + clockintr_cpu_init(&agtimer_intrclock); > > reg = agtimer_get_ctrl(); > reg &= ~GTIMER_CNTV_CTL_IMASK; > reg |= GTIMER_CNTV_CTL_ENABLE; > - agtimer_set_tval(sc->sc_ticks_per_second); > + agtimer_set_tval(INT32_MAX); > agtimer_set_ctrl(reg); > > + clockintr_trigger(); > + > /* enable userland access to virtual counter */ > kctl = READ_SPECIALREG(CNTKCTL_EL1); > WRITE_SPECIALREG(CNTKCTL_EL1, kctl | CNTKCTL_EL0VCTEN); > @@ -367,48 +317,27 @@ agtimer_delay(u_int usecs) > void > agtimer_setstatclockrate(int newhz) > { > - struct agtimer_softc *sc = agtimer_cd.cd_devs[0]; > - int minint, statint; > - int s; > - > - s = splclock(); > - > - statint = sc->sc_ticks_per_second / newhz; > - /* calculate largest 2^n which is smaller that just over half statint */ > - sc->sc_statvar = 0x40000000; /* really big power of two */ > - minint = statint / 2 + 100; > - while (sc->sc_statvar > minint) > - sc->sc_statvar >>= 1; > - > - sc->sc_statmin = statint - (sc->sc_statvar >> 1); > - > - splx(s); > - > - /* > - * XXX this allows the next stat timer to occur then it switches > - * to the new frequency. Rather than switching instantly. > - */ > + clockintr_setstatclockrate(newhz); > } > > void > agtimer_startclock(void) > { > struct agtimer_softc *sc = agtimer_cd.cd_devs[0]; > - struct agtimer_pcpu_softc *pc = &sc->sc_pstat[CPU_INFO_UNIT(curcpu())]; > - uint64_t nextevent; > uint64_t kctl; > uint32_t reg; > > - nextevent = agtimer_readcnt64() + sc->sc_ticks_per_intr; > - pc->pc_nexttickevent = pc->pc_nextstatevent = nextevent; > - > arm_intr_route(sc->sc_ih, 1, curcpu()); > > + clockintr_cpu_init(&agtimer_intrclock); > + > reg = agtimer_get_ctrl(); > reg &= ~GTIMER_CNTV_CTL_IMASK; > reg |= GTIMER_CNTV_CTL_ENABLE; > - agtimer_set_tval(sc->sc_ticks_per_second); > + agtimer_set_tval(INT32_MAX); > agtimer_set_ctrl(reg); > + > + clockintr_trigger(); > > /* enable userland access to virtual counter */ > kctl = READ_SPECIALREG(CNTKCTL_EL1); > Index: sys/arch/arm64/include/cpu.h > =================================================================== > RCS file: /cvs/src/sys/arch/arm64/include/cpu.h,v > retrieving revision 1.28 > diff -u -p -r1.28 cpu.h > --- sys/arch/arm64/include/cpu.h 29 Aug 2022 02:01:18 -0000 1.28 > +++ sys/arch/arm64/include/cpu.h 6 Nov 2022 18:48:22 -0000 > @@ -81,6 +81,7 @@ void arm32_vector_init(vaddr_t, int); > * Per-CPU information. For now we assume one CPU. > */ > > +#include <sys/clockintr.h> > #include <sys/device.h> > #include <sys/sched.h> > #include <sys/srp.h> > @@ -142,7 +143,7 @@ struct cpu_info { > #ifdef GPROF > struct gmonparam *ci_gmon; > #endif > - > + struct clockintr_queue ci_queue; > char ci_panicbuf[512]; > }; > > Index: sys/arch/arm64/include/_types.h > =================================================================== > RCS file: /cvs/src/sys/arch/arm64/include/_types.h,v > retrieving revision 1.4 > diff -u -p -r1.4 _types.h > --- sys/arch/arm64/include/_types.h 5 Mar 2018 01:15:25 -0000 1.4 > +++ sys/arch/arm64/include/_types.h 6 Nov 2022 18:48:22 -0000 > @@ -34,6 +34,8 @@ > #ifndef _MACHINE__TYPES_H_ > #define _MACHINE__TYPES_H_ > > +#define __HAVE_CLOCKINTR > + > #if defined(_KERNEL) > typedef struct label_t { > long val[13]; > >