@@ -64,7 +64,6 @@ getWarpsPerTile(tt::DotOp dotOp,
6464 ceil<uint32_t >(dpasCap.repeatCount , dpasCap.executionSize );
6565 uint32_t colRowRatio =
6666 ceil<uint32_t >(dpasCap.executionSize , dpasCap.repeatCount );
67- llvm::errs () << " rowColRation: " << rowColRatio << " , colRowRatio: " << colRowRatio << " , ret: " << ret[0 ] << " , " << ret[1 ] << " \n " ;
6867
6968 int rowDim = order[rank - 2 ], colDim = order[rank - 1 ];
7069 do {
@@ -119,20 +118,19 @@ class BlockedToDPAS : public OpRewritePattern<tt::DotOp> {
119118 unsigned opsPerChan =
120119 ttg::intel::DpasEncodingAttr::getOpsPerChannel (elemType);
121120
122- SmallVector<unsigned > order = {0 , 1 };
121+ SmallVector<unsigned > order = {0 , 1 };
123122 Operation *aOp = a.getDefiningOp ();
124123 if (isa<ttg::ConvertLayoutOp>(aOp)) {
125- auto valueToConvert = aOp->getOperand (0 );
126- aOp = valueToConvert.getDefiningOp ();
124+ auto valueToConvert = aOp->getOperand (0 );
125+ aOp = valueToConvert.getDefiningOp ();
127126 }
128127 if (aOp && isa<tt::LoadOp>(aOp)) {
129128 Attribute layout;
130- assert (aOp->getNumResults () == 1 );
131- layout =
132- cast<RankedTensorType>(aOp->getResult (0 ).getType ()).getEncoding ();
129+ assert (aOp->getNumResults () == 1 );
130+ layout =
131+ cast<RankedTensorType>(aOp->getResult (0 ).getType ()).getEncoding ();
133132 order = triton::gpu::getOrder (layout);
134133 }
135- llvm::errs () << " order: " << order[0 ] << " , " << order[1 ] << " \n " ;
136134
137135 SmallVector<unsigned > warpsPerTile =
138136 getWarpsPerTile (dotOp, dpasCap, retShape, numWarps, order);
0 commit comments