mirror of https://github.com/tracel-ai/burn.git
unroll transpose
This commit is contained in:
parent
081fd782af
commit
61ca9ff0b6
|
@@ -193,7 +193,9 @@ fn write_tile_transposed<F: Float>(
|
|||
} else {
|
||||
for i in range(0u32, Comptime::get(tile_size), unroll) {
|
||||
let mut transposed = F::vectorized(0., Comptime::get(tile_size));
|
||||
for j in range(0u32, Comptime::get(tile_size), unroll) {
|
||||
|
||||
// Unrolling this one makes the difference
|
||||
for j in range(0u32, Comptime::get(tile_size), Comptime::new(true)) {
|
||||
transposed[j] = tile[j][i];
|
||||
}
|
||||
|
||||
|
|
Loading…
Reference in New Issue