const PREFERRED_VECTOR_SIZE_NON_NULL: usize = _; // 32usize
Non-nullable aggregation requires fewer temporary registers, so more of the registers can be used for accumulators.