# Benchmark an in-place BLAS product written into a view of a larger matrix
# against the allocating expression `v' * v`.
# NOTE(review): assumes BenchmarkTools (`@btime`) and LinearAlgebra (`BLAS`)
# are already loaded in this session — confirm.
t = zeros(1010, 1010)
v = rand(1000, 1000)
c = view(t, 11:1010, 11:1010)  # 1000×1000 window into `t`; writes to `c` land in `t`

# `$` interpolates the non-constant globals into the benchmark expression so
# that global-variable lookup and dynamic dispatch are not part of the timing.
# The trailing figures are the originally reported results, recorded without
# interpolation; re-measure before relying on them.

# gemm!('T', 'N', 1., v, v, 1., c) updates c = 1.0 * v' * v + 1.0 * c in place,
# so `c` keeps accumulating across benchmark evaluations (beta = 1).
@btime BLAS.gemm!('T', 'N', 1., $v, $v, 1., $c) # 6.135 ms (0 allocations: 0 bytes)
# Allocating counterpart: builds a fresh result matrix on every evaluation.
@btime $v' * $v # 5.226 ms (3 allocations: 7.63 MiB)
1 Like