Skip to content

Commit 3571600

Browse files
committed
Don't emit calls to Eigen for the dot operator. Emit an LLVM loop instead to provide visibility to Polly.
1 parent 1340b50 commit 3571600

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

tensorflow/compiler/xla/service/cpu/dot_op_emitter.cc

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1013,6 +1013,7 @@ bool PotentiallyImplementedAsEigenDot(const HloInstruction& hlo) {
10131013
DotInLlvmIrProfitable ProfitableToImplementDotInUntiledLlvmIr(
10141014
const HloInstruction& dot) {
10151015
if (dot.opcode() == HloOpcode::kDot && dot.shape().dimensions_size() == 2) {
1016+
#if 0
10161017
const Shape& result_shape = dot.shape();
10171018
// kReductionDimensionThresholdBytes was chosen to be 1/4 of a typical L1
10181019
// cache line size, so that we can have the reduction dimension of both the
@@ -1048,6 +1049,8 @@ DotInLlvmIrProfitable ProfitableToImplementDotInUntiledLlvmIr(
10481049
? DotInLlvmIrProfitable::kWithColumnMajorRhs
10491050
: DotInLlvmIrProfitable::kYes;
10501051
}
1052+
#endif
1053+
return DotInLlvmIrProfitable::kYes;
10511054
}
10521055
return DotInLlvmIrProfitable::kNo;
10531056
}

0 commit comments

Comments
 (0)