Fix issues with zeroing and fetching the counters on x86 and ppc64.

Issues were noted by Bruce Evans and are present on all architectures.

On i386, a counter fetch should use an atomic read of the 64bit value,
otherwise a carry from an increment on another CPU could be lost for
the given fetch, making the result off by 2^32.  If an atomic 64bit
read (cmpxchg8b) is not available on the machine, it cannot be SMP,
and it is enough to disable preemption around the read to avoid a
split read.
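
For illustration, a hypothetical split read on a little-endian 32bit
CPU (this sketch is not part of the commit):

#include <stdint.h>

static uint64_t
split_read_racy(volatile uint64_t *p)
{
	volatile uint32_t *q = (volatile uint32_t *)p; /* q[0] is low half */
	uint32_t lo, hi;

	lo = q[0];		/* reads 0xffffffff */
	/* another CPU increments the counter to 0x100000000 here */
	hi = q[1];		/* reads 0x1 */
	return (((uint64_t)hi << 32) | lo); /* 0x1ffffffff: off by ~2^32 */
}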

On x86 the counter increment is deliberately not atomic, which makes
it possible for the store of the incremented result to overwrite a
just-zeroed per-cpu slot.  The effect would be a counter going off by
an arbitrary value after zeroing.  Perform the counter zeroing on the
same processor which does the increments, making the two operations
mutually exclusive.  On i386, as with fetching, if cmpxchg8b is not
available the machine is not SMP and we disable preemption around the
zeroing.
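
A hypothetical interleaving (again not part of the commit) shows the
race: the increment is a plain read-modify-write of the per-cpu slot,
so its final store can overwrite a zero written from another CPU in
between:

static void
increment_racy(volatile uint64_t *slot)	/* runs on the slot's own CPU */
{
	uint64_t tmp;

	tmp = *slot;		/* tmp == 5 */
	/* another CPU stores 0 to *slot here */
	*slot = tmp + 1;	/* *slot == 6: the zeroing is lost */
}

Running the store of zero on the owning CPU itself, e.g. via
smp_rendezvous(), serializes it with the increments, which never run
on another CPU.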

PowerPC64 is treated the same as amd64.

For other architectures, the changes only allow the compilation to
succeed; they do not fix the issues with zeroing or fetching.  It
should be possible to handle them by using 64bit loads and stores
that are atomic WRT preemption (assuming the architectures are also
converted from using critical sections to proper asm).  If an
architecture does not provide such a facility, a global (spin) mutex
would be a non-optimal but working solution; a sketch follows.
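
A minimal sketch of that fallback, assuming an architecture without
preemption-atomic 64bit loads and stores.  The mutex name and SYSINIT
hookup are hypothetical, and the increment path would have to take
the same mutex, which is what makes this non-optimal:

static struct mtx counter_global_mtx;
MTX_SYSINIT(counter_global_mtx, &counter_global_mtx, "counter", MTX_SPIN);

static inline uint64_t
counter_u64_fetch_inline(uint64_t *p)
{
	uint64_t r;
	int i;

	r = 0;
	mtx_lock_spin(&counter_global_mtx);
	for (i = 0; i < mp_ncpus; i++)
		r += *(uint64_t *)((char *)p + sizeof(struct pcpu) * i);
	mtx_unlock_spin(&counter_global_mtx);
	return (r);
}

static inline void
counter_u64_zero_inline(counter_u64_t c)
{
	int i;

	mtx_lock_spin(&counter_global_mtx);
	for (i = 0; i < mp_ncpus; i++)
		*(uint64_t *)((char *)c + sizeof(struct pcpu) * i) = 0;
	mtx_unlock_spin(&counter_global_mtx);
}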

Noted by:  bde
Sponsored by:	The FreeBSD Foundation
commit 70a7dd5d5b
parent 7476f6973c
Author: Konstantin Belousov
Date:   2013-07-01 02:48:27 +00:00
Notes (svn2git, 2020-12-20 02:59:44 +00:00): svn path=/head/; revision=252434

8 changed files with 370 additions and 11 deletions

@@ -36,6 +36,44 @@ extern struct pcpu __pcpu[1];
 #define	counter_enter()	do {} while (0)
 #define	counter_exit()	do {} while (0)
 
+#ifdef IN_SUBR_COUNTER_C
+static inline uint64_t
+counter_u64_read_one(uint64_t *p, int cpu)
+{
+
+	return (*(uint64_t *)((char *)p + sizeof(struct pcpu) * cpu));
+}
+
+static inline uint64_t
+counter_u64_fetch_inline(uint64_t *p)
+{
+	uint64_t r;
+	int i;
+
+	r = 0;
+	for (i = 0; i < mp_ncpus; i++)
+		r += counter_u64_read_one((uint64_t *)p, i);
+
+	return (r);
+}
+
+static void
+counter_u64_zero_one_cpu(void *arg)
+{
+
+	*((uint64_t *)((char *)arg + sizeof(struct pcpu) *
+	    PCPU_GET(cpuid))) = 0;
+}
+
+static inline void
+counter_u64_zero_inline(counter_u64_t c)
+{
+
+	smp_rendezvous(smp_no_rendevous_barrier, counter_u64_zero_one_cpu,
+	    smp_no_rendevous_barrier, c);
+}
+#endif
+
 #define	counter_u64_add_protected(c, i)	counter_u64_add(c, i)
 
 static inline void

@@ -37,6 +37,46 @@
 #define	counter_enter()	critical_enter()
 #define	counter_exit()	critical_exit()
 
+#ifdef IN_SUBR_COUNTER_C
+/* XXXKIB non-atomic 64bit read */
+static inline uint64_t
+counter_u64_read_one(uint64_t *p, int cpu)
+{
+
+	return (*(uint64_t *)((char *)p + sizeof(struct pcpu) * cpu));
+}
+
+static inline uint64_t
+counter_u64_fetch_inline(uint64_t *p)
+{
+	uint64_t r;
+	int i;
+
+	r = 0;
+	for (i = 0; i < mp_ncpus; i++)
+		r += counter_u64_read_one((uint64_t *)p, i);
+
+	return (r);
+}
+
+/* XXXKIB non-atomic 64bit store, might interrupt increment */
+static void
+counter_u64_zero_one_cpu(void *arg)
+{
+
+	*((uint64_t *)((char *)arg + sizeof(struct pcpu) *
+	    PCPU_GET(cpuid))) = 0;
+}
+
+static inline void
+counter_u64_zero_inline(counter_u64_t c)
+{
+
+	smp_rendezvous(smp_no_rendevous_barrier, counter_u64_zero_one_cpu,
+	    smp_no_rendevous_barrier, c);
+}
+#endif
+
 #define	counter_u64_add_protected(c, inc)	do {	\
 	CRITICAL_ASSERT(curthread);			\
 	*(uint64_t *)zpcpu_get(c) += (inc);		\

@@ -67,6 +67,93 @@ counter_64_inc_8b(uint64_t *p, int64_t inc)
 	    : "memory", "cc", "eax", "edx", "ebx", "ecx");
 }
 
+#ifdef IN_SUBR_COUNTER_C
+static inline uint64_t
+counter_u64_read_one_8b(uint64_t *p)
+{
+	uint32_t res_lo, res_high;
+
+	__asm __volatile(
+	"movl	%%eax,%%ebx\n\t"
+	"movl	%%edx,%%ecx\n\t"
+	"cmpxchg8b	(%2)"
+	: "=a" (res_lo), "=d"(res_high)
+	: "SD" (p)
+	: "cc", "ebx", "ecx");
+	return (res_lo + ((uint64_t)res_high << 32));
+}
+
+static inline uint64_t
+counter_u64_fetch_inline(uint64_t *p)
+{
+	uint64_t res;
+	int i;
+
+	res = 0;
+	if ((cpu_feature & CPUID_CX8) == 0) {
+		/*
+		 * The machines without cmpxchg8b are not SMP.
+		 * Disabling the preemption provides atomicity of the
+		 * counter reading, since update is done in the
+		 * critical section as well.
+		 */
+		critical_enter();
+		for (i = 0; i < mp_ncpus; i++) {
+			res += *(uint64_t *)((char *)p +
+			    sizeof(struct pcpu) * i);
+		}
+		critical_exit();
+	} else {
+		for (i = 0; i < mp_ncpus; i++)
+			res += counter_u64_read_one_8b((uint64_t *)((char *)p +
+			    sizeof(struct pcpu) * i));
+	}
+	return (res);
+}
+
+static inline void
+counter_u64_zero_one_8b(uint64_t *p)
+{
+
+	__asm __volatile(
+	"movl	(%0),%%eax\n\t"
+	"movl	4(%0),%%edx\n"
+	"xorl	%%ebx,%%ebx\n\t"
+	"xorl	%%ecx,%%ecx\n\t"
+"1:\n\t"
+	"cmpxchg8b	(%0)\n\t"
+	"jnz	1b"
+	:
+	: "SD" (p)
+	: "memory", "cc", "eax", "edx", "ebx", "ecx");
+}
+
+static void
+counter_u64_zero_one_cpu(void *arg)
+{
+	uint64_t *p;
+
+	p = (uint64_t *)((char *)arg + sizeof(struct pcpu) * PCPU_GET(cpuid));
+	counter_u64_zero_one_8b(p);
+}
+
+static inline void
+counter_u64_zero_inline(counter_u64_t c)
+{
+	int i;
+
+	if ((cpu_feature & CPUID_CX8) == 0) {
+		critical_enter();
+		for (i = 0; i < mp_ncpus; i++)
+			*(uint64_t *)((char *)c + sizeof(struct pcpu) * i) = 0;
+		critical_exit();
+	} else {
+		smp_rendezvous(smp_no_rendevous_barrier,
+		    counter_u64_zero_one_cpu, smp_no_rendevous_barrier, c);
+	}
+}
+#endif
+
 #define	counter_u64_add_protected(c, inc)	do {	\
 	if ((cpu_feature & CPUID_CX8) == 0) {		\
 		CRITICAL_ASSERT(curthread);		\

@@ -37,6 +37,45 @@
 #define	counter_enter()	critical_enter()
 #define	counter_exit()	critical_exit()
 
+#ifdef IN_SUBR_COUNTER_C
+static inline uint64_t
+counter_u64_read_one(uint64_t *p, int cpu)
+{
+
+	return (*(uint64_t *)((char *)p + sizeof(struct pcpu) * cpu));
+}
+
+static inline uint64_t
+counter_u64_fetch_inline(uint64_t *p)
+{
+	uint64_t r;
+	int i;
+
+	r = 0;
+	for (i = 0; i < mp_ncpus; i++)
+		r += counter_u64_read_one((uint64_t *)p, i);
+
+	return (r);
+}
+
+/* XXXKIB might interrupt increment */
+static void
+counter_u64_zero_one_cpu(void *arg)
+{
+
+	*((uint64_t *)((char *)arg + sizeof(struct pcpu) *
+	    PCPU_GET(cpuid))) = 0;
+}
+
+static inline void
+counter_u64_zero_inline(counter_u64_t c)
+{
+
+	smp_rendezvous(smp_no_rendevous_barrier, counter_u64_zero_one_cpu,
+	    smp_no_rendevous_barrier, c);
+}
+#endif
+
 #define	counter_u64_add_protected(c, inc)	do {	\
 	CRITICAL_ASSERT(curthread);			\
 	*(uint64_t *)zpcpu_get(c) += (inc);		\

@@ -29,34 +29,32 @@ __FBSDID("$FreeBSD$");
 
 #include <sys/param.h>
 #include <sys/systm.h>
-#include <sys/counter.h>
 #include <sys/kernel.h>
+#include <sys/lock.h>
+#include <sys/mutex.h>
+#include <sys/proc.h>
+#include <sys/sched.h>
 #include <sys/smp.h>
 #include <sys/sysctl.h>
 #include <vm/uma.h>
+
+#define IN_SUBR_COUNTER_C
+#include <sys/counter.h>
 
 static uma_zone_t uint64_pcpu_zone;
 
 void
 counter_u64_zero(counter_u64_t c)
 {
-	int i;
 
-	for (i = 0; i < mp_ncpus; i++)
-		*(uint64_t *)((char *)c + sizeof(struct pcpu) * i) = 0;
+	counter_u64_zero_inline(c);
 }
 
 uint64_t
 counter_u64_fetch(counter_u64_t c)
 {
-	uint64_t r;
-	int i;
 
-	r = 0;
-	for (i = 0; i < mp_ncpus; i++)
-		r += *(uint64_t *)((char *)c + sizeof(struct pcpu) * i);
-	return (r);
+	return (counter_u64_fetch_inline(c));
 }
 
 counter_u64_t

@@ -37,6 +37,46 @@
 #define	counter_enter()	critical_enter()
 #define	counter_exit()	critical_exit()
 
+#ifdef IN_SUBR_COUNTER_C
+/* XXXKIB non-atomic 64bit read on 32bit */
+static inline uint64_t
+counter_u64_read_one(uint64_t *p, int cpu)
+{
+
+	return (*(uint64_t *)((char *)p + sizeof(struct pcpu) * cpu));
+}
+
+static inline uint64_t
+counter_u64_fetch_inline(uint64_t *p)
+{
+	uint64_t r;
+	int i;
+
+	r = 0;
+	for (i = 0; i < mp_ncpus; i++)
+		r += counter_u64_read_one((uint64_t *)p, i);
+
+	return (r);
+}
+
+/* XXXKIB non-atomic 64bit store on 32bit, might interrupt increment */
+static void
+counter_u64_zero_one_cpu(void *arg)
+{
+
+	*((uint64_t *)((char *)arg + sizeof(struct pcpu) *
+	    PCPU_GET(cpuid))) = 0;
+}
+
+static inline void
+counter_u64_zero_inline(counter_u64_t c)
+{
+
+	smp_rendezvous(smp_no_rendevous_barrier, counter_u64_zero_one_cpu,
+	    smp_no_rendevous_barrier, c);
+}
+#endif
+
 #define	counter_u64_add_protected(c, inc)	do {	\
 	CRITICAL_ASSERT(curthread);			\
 	*(uint64_t *)zpcpu_get(c) += (inc);		\

@@ -39,6 +39,44 @@
 #define	counter_enter()	do {} while (0)
 #define	counter_exit()	do {} while (0)
 
+#ifdef IN_SUBR_COUNTER_C
+static inline uint64_t
+counter_u64_read_one(uint64_t *p, int cpu)
+{
+
+	return (*(uint64_t *)((char *)p + sizeof(struct pcpu) * cpu));
+}
+
+static inline uint64_t
+counter_u64_fetch_inline(uint64_t *p)
+{
+	uint64_t r;
+	int i;
+
+	r = 0;
+	for (i = 0; i < mp_ncpus; i++)
+		r += counter_u64_read_one((uint64_t *)p, i);
+
+	return (r);
+}
+
+static void
+counter_u64_zero_one_cpu(void *arg)
+{
+
+	*((uint64_t *)((char *)arg + sizeof(struct pcpu) *
+	    PCPU_GET(cpuid))) = 0;
+}
+
+static inline void
+counter_u64_zero_inline(counter_u64_t c)
+{
+
+	smp_rendezvous(smp_no_rendevous_barrier, counter_u64_zero_one_cpu,
+	    smp_no_rendevous_barrier, c);
+}
+#endif
+
 #define	counter_u64_add_protected(c, i)	counter_u64_add(c, i)
 
 extern struct pcpu __pcpu[MAXCPU];
@@ -65,6 +103,46 @@ counter_u64_add(counter_u64_t c, int64_t inc)
 #define	counter_enter()	critical_enter()
 #define	counter_exit()	critical_exit()
 
+#ifdef IN_SUBR_COUNTER_C
+/* XXXKIB non-atomic 64bit read */
+static inline uint64_t
+counter_u64_read_one(uint64_t *p, int cpu)
+{
+
+	return (*(uint64_t *)((char *)p + sizeof(struct pcpu) * cpu));
+}
+
+static inline uint64_t
+counter_u64_fetch_inline(uint64_t *p)
+{
+	uint64_t r;
+	int i;
+
+	r = 0;
+	for (i = 0; i < mp_ncpus; i++)
+		r += counter_u64_read_one((uint64_t *)p, i);
+
+	return (r);
+}
+
+/* XXXKIB non-atomic 64bit store, might interrupt increment */
+static void
+counter_u64_zero_one_cpu(void *arg)
+{
+
+	*((uint64_t *)((char *)arg + sizeof(struct pcpu) *
+	    PCPU_GET(cpuid))) = 0;
+}
+
+static inline void
+counter_u64_zero_inline(counter_u64_t c)
+{
+
+	smp_rendezvous(smp_no_rendevous_barrier, counter_u64_zero_one_cpu,
+	    smp_no_rendevous_barrier, c);
+}
+#endif
+
 #define	counter_u64_add_protected(c, inc)	do {	\
 	CRITICAL_ASSERT(curthread);			\
 	*(uint64_t *)zpcpu_get(c) += (inc);		\

@@ -37,6 +37,45 @@
 #define	counter_enter()	critical_enter()
 #define	counter_exit()	critical_exit()
 
+#ifdef IN_SUBR_COUNTER_C
+static inline uint64_t
+counter_u64_read_one(uint64_t *p, int cpu)
+{
+
+	return (*(uint64_t *)((char *)p + sizeof(struct pcpu) * cpu));
+}
+
+static inline uint64_t
+counter_u64_fetch_inline(uint64_t *p)
+{
+	uint64_t r;
+	int i;
+
+	r = 0;
+	for (i = 0; i < mp_ncpus; i++)
+		r += counter_u64_read_one((uint64_t *)p, i);
+
+	return (r);
+}
+
+/* XXXKIB might interrupt increment */
+static void
+counter_u64_zero_one_cpu(void *arg)
+{
+
+	*((uint64_t *)((char *)arg + sizeof(struct pcpu) *
+	    PCPU_GET(cpuid))) = 0;
+}
+
+static inline void
+counter_u64_zero_inline(counter_u64_t c)
+{
+
+	smp_rendezvous(smp_no_rendevous_barrier, counter_u64_zero_one_cpu,
+	    smp_no_rendevous_barrier, c);
+}
+#endif
+
 #define	counter_u64_add_protected(c, inc)	do {	\
 	CRITICAL_ASSERT(curthread);			\
 	*(uint64_t *)zpcpu_get(c) += (inc);		\