Skip to content

Commit

Permalink
Blas: fix frob inner prod (#2045)
Browse files Browse the repository at this point in the history
  • Loading branch information
wsmoses authored Aug 21, 2024
1 parent 7a5727b commit cc65abd
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions enzyme/Enzyme/Utils.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -1231,8 +1231,8 @@ getorInsertInnerProd(llvm::IRBuilder<> &B, llvm::Module &M, BlasInfo blas,
B3.setFastMathFlags(getFast());
Value *blasA = B3.CreatePointerCast(matA, BlasPT);
Value *blasB = B3.CreatePointerCast(matB, BlasPT);
Value *fastSum = B3.CreateCall(
FDot, {blasSize, blasA, blasOne, blasB, blasOne}, bundles);
Value *fastSum =
B3.CreateCall(FDot, {blasSize, blasA, blasOne, blasB, blasOne});
B3.CreateBr(end);

IRBuilder<> B4(body);
Expand All @@ -1251,7 +1251,7 @@ getorInsertInnerProd(llvm::IRBuilder<> &B, llvm::Module &M, BlasInfo blas,
Value *AiDot = B4.CreatePointerCast(Ai, BlasPT);
Value *BiDot = B4.CreatePointerCast(Bi, BlasPT);
Value *newDot =
B4.CreateCall(FDot, {blasm, AiDot, blasOne, BiDot, blasOne}, bundles);
B4.CreateCall(FDot, {blasm, AiDot, blasOne, BiDot, blasOne});

Value *Anext = B4.CreateNUWAdd(Aidx, lda, "Aidx.next");
Value *Bnext = B4.CreateNUWAdd(Aidx, m, "Bidx.next");
Expand Down

0 comments on commit cc65abd

Please sign in to comment.