/*
 * NOTE(review): the next line is a bare identifier; the definition that
 * gives WAITING_BITS its value is not visible in this excerpt.
 */
WAITING_BITS
/*
 * Number of distinct values that fit in a WAITING_BITS-wide bit field,
 * i.e. 2^WAITING_BITS.
 * NOTE(review): presumably the upper bound on the CPU count stored in such
 * a field -- confirm against the users of this macro.
 */
#define MAX_WAITING_CPUS (1 << WAITING_BITS)
/*
 * Build a word holding online_count twice: once in the low bits and once
 * shifted up by WAITING_BITS.
 * NOTE(review): presumably the value ready_waiting_counts takes when every
 * online CPU is counted in both fields -- confirm at the use site of 'all'.
 */
all = coupled->online_count | (coupled->online_count << WAITING_BITS);
/*
 * Read the packed counter atomically and drop its low WAITING_BITS bits,
 * leaving the field stored above them.
 * NOTE(review): going by the variable name, the upper field looks like the
 * "ready" count -- confirm.
 */
int r = atomic_read(&coupled->ready_waiting_counts) >> WAITING_BITS;
/*
 * Same extraction of the upper field as the statement above.
 * NOTE(review): this repeats the previous declaration verbatim; within one
 * scope it would redefine 'r', so the two lines presumably belong to
 * different functions -- confirm.
 */
int r = atomic_read(&coupled->ready_waiting_counts) >> WAITING_BITS;