unroll transpose

This commit is contained in:
louisfd 2024-06-28 11:08:56 -04:00
parent 081fd782af
commit 61ca9ff0b6
1 changed file with 3 additions and 1 deletion

View File

@@ -193,7 +193,9 @@ fn write_tile_transposed<F: Float>(
} else {
for i in range(0u32, Comptime::get(tile_size), unroll) {
let mut transposed = F::vectorized(0., Comptime::get(tile_size));
-for j in range(0u32, Comptime::get(tile_size), unroll) {
+// Unrolling this one makes the difference
+for j in range(0u32, Comptime::get(tile_size), Comptime::new(true)) {
transposed[j] = tile[j][i];
}