in gemmology.h [1072:1076]
// Stores one batch of 32-bit lanes into the output buffer.
//
// The lanes of `result` are reinterpreted bit-for-bit as floats (a bitwise
// cast, not a numeric int-to-float conversion) and written with an aligned
// store starting at element offset `row_idx * col_size + col_idx` from
// `output_addr`.
//
// NOTE(review): store_aligned presumably requires the destination address to
// meet the batch alignment of Arch — confirm that callers guarantee this.
void Write::operator()(xsimd::batch<int32_t, Arch> result, size_t row_idx,
size_t col_idx, size_t col_size) {
  // Destination of the first lane: row `row_idx`, column `col_idx`, with
  // `col_size` elements per row.
  const auto destination = output_addr + row_idx * col_size + col_idx;

  // Same bits, viewed as float lanes.
  auto reinterpreted = xsimd::bitwise_cast<float>(result);
  reinterpreted.store_aligned(destination);
}