Skip to content

Commit

Permalink
Merge branch 'feature/ntt_benchmark_roofline_3' of https://github.com…
Browse files Browse the repository at this point in the history
…/kendryte/nncase into feature/ntt_benchmark_roofline_3
  • Loading branch information
guodongliang committed Sep 30, 2024
2 parents a553d9a + 0faa9c3 commit bfcbeb1
Showing 1 changed file with 3 additions and 2 deletions.
5 changes: 3 additions & 2 deletions src/Native/include/nncase/ntt/ukernels/u_matmul.h
Original file line number Diff line number Diff line change
Expand Up @@ -210,8 +210,9 @@ struct u_matmul<ukernels::mamtul_pack_kind::pack_mkn, AccumulateC, M0Tile,
});

for (size_t k1 = 0; k1 < K; k1++) {
volatile size_t sk1_max = TLhsElem::shape()[1];
[[assume(sk1_max > 0)]];
// Prevent the compiler from unrolling this loop.
size_t sk1_max = TLhsElem::shape()[1];
#pragma GCC unroll 1
for (size_t sk1 = 0; sk1 < sk1_max; sk1++) {
using TSubLhsElem = typename TLhsElem::element_type;
using TSubRhsElem =
Expand Down

0 comments on commit bfcbeb1

Please sign in to comment.