template inline T findMSBS32(T x) { return select(clz(T(0)) - (clz(x) + T(1)), T(-1), x == T(0)); }