[LV][VPlan] Prevent calculate cost for skiped instructions in precomp… · llvm/llvm-project@5b552d7 (original) (raw)

`@@ -1211,6 +1211,130 @@ exit:

`

1211

1211

`ret i32 %or

`

1212

1212

`}

`

1213

1213

``

``

1214

`+

; Check if the vplan-based cost model select same VF to the legacy cost model.

`

``

1215

`+

; Reduced from: https://github.com/llvm/llvm-project/issues/115744#issuecomment-2670479463

`

``

1216

`+

define i32 @g(i64 %n) {

`

``

1217

`+

; CHECK-LABEL: @g(

`

``

1218

`+

; CHECK-NEXT: iter.check:

`

``

1219

`+

; CHECK-NEXT: [[TMP0:%.]] = trunc i64 [[N:%.]] to i32

`

``

1220

`+

; CHECK-NEXT: [[TMP1:%.*]] = add i32 [[TMP0]], 1

`

``

1221

`+

; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i32 [[TMP1]], 4

`

``

1222

`+

; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label [[VEC_EPILOG_SCALAR_PH:%.]], label [[VECTOR_SCEVCHECK:%.]]

`

``

1223

`+

; CHECK: vector.scevcheck:

`

``

1224

`+

; CHECK-NEXT: [[TMP2:%.*]] = icmp ugt i64 [[N]], 4294967295

`

``

1225

`+

; CHECK-NEXT: br i1 [[TMP2]], label [[VEC_EPILOG_SCALAR_PH]], label [[VECTOR_MAIN_LOOP_ITER_CHECK:%.*]]

`

``

1226

`+

; CHECK: vector.main.loop.iter.check:

`

``

1227

`+

; CHECK-NEXT: [[MIN_ITERS_CHECK1:%.*]] = icmp ult i32 [[TMP1]], 16

`

``

1228

`+

; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK1]], label [[VEC_EPILOG_PH:%.]], label [[VECTOR_PH:%.]]

`

``

1229

`+

; CHECK: vector.ph:

`

``

1230

`+

; CHECK-NEXT: [[N_MOD_VF:%.*]] = urem i32 [[TMP1]], 16

`

``

1231

`+

; CHECK-NEXT: [[N_VEC:%.*]] = sub i32 [[TMP1]], [[N_MOD_VF]]

`

``

1232

`+

; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <4 x i64> poison, i64 [[N]], i64 0

`

``

1233

`+

; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <4 x i64> [[BROADCAST_SPLATINSERT]], <4 x i64> poison, <4 x i32> zeroinitializer

`

``

1234

`+

; CHECK-NEXT: br label [[VECTOR_BODY:%.*]]

`

``

1235

`+

; CHECK: vector.body:

`

``

1236

`+

; CHECK-NEXT: [[INDEX:%.]] = phi i32 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.]], [[VECTOR_BODY]] ]

`

``

1237

`+

; CHECK-NEXT: [[VEC_IND:%.]] = phi <4 x i32> [ <i32 0, i32 1, i32 2, i32 3>, [[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.]], [[VECTOR_BODY]] ]

`

``

1238

`+

; CHECK-NEXT: [[VEC_PHI:%.]] = phi <4 x i32> [ zeroinitializer, [[VECTOR_PH]] ], [ [[TMP15:%.]], [[VECTOR_BODY]] ]

`

``

1239

`+

; CHECK-NEXT: [[VEC_PHI2:%.]] = phi <4 x i32> [ zeroinitializer, [[VECTOR_PH]] ], [ [[TMP16:%.]], [[VECTOR_BODY]] ]

`

``

1240

`+

; CHECK-NEXT: [[VEC_PHI3:%.]] = phi <4 x i32> [ zeroinitializer, [[VECTOR_PH]] ], [ [[TMP17:%.]], [[VECTOR_BODY]] ]

`

``

1241

`+

; CHECK-NEXT: [[VEC_PHI4:%.]] = phi <4 x i32> [ zeroinitializer, [[VECTOR_PH]] ], [ [[TMP18:%.]], [[VECTOR_BODY]] ]

`

``

1242

`+

; CHECK-NEXT: [[STEP_ADD:%.*]] = add <4 x i32> [[VEC_IND]], splat (i32 4)

`

``

1243

`+

; CHECK-NEXT: [[STEP_ADD_2:%.*]] = add <4 x i32> [[STEP_ADD]], splat (i32 4)

`

``

1244

`+

; CHECK-NEXT: [[STEP_ADD_3:%.*]] = add <4 x i32> [[STEP_ADD_2]], splat (i32 4)

`

``

1245

`+

; CHECK-NEXT: [[TMP3:%.*]] = zext <4 x i32> [[VEC_IND]] to <4 x i64>

`

``

1246

`+

; CHECK-NEXT: [[TMP4:%.*]] = zext <4 x i32> [[STEP_ADD]] to <4 x i64>

`

``

1247

`+

; CHECK-NEXT: [[TMP5:%.*]] = zext <4 x i32> [[STEP_ADD_2]] to <4 x i64>

`

``

1248

`+

; CHECK-NEXT: [[TMP6:%.*]] = zext <4 x i32> [[STEP_ADD_3]] to <4 x i64>

`

``

1249

`+

; CHECK-NEXT: [[TMP7:%.*]] = icmp eq <4 x i64> [[BROADCAST_SPLAT]], [[TMP3]]

`

``

1250

`+

; CHECK-NEXT: [[TMP8:%.*]] = icmp eq <4 x i64> [[BROADCAST_SPLAT]], [[TMP4]]

`

``

1251

`+

; CHECK-NEXT: [[TMP9:%.*]] = icmp eq <4 x i64> [[BROADCAST_SPLAT]], [[TMP5]]

`

``

1252

`+

; CHECK-NEXT: [[TMP10:%.*]] = icmp eq <4 x i64> [[BROADCAST_SPLAT]], [[TMP6]]

`

``

1253

`+

; CHECK-NEXT: [[TMP11:%.*]] = select <4 x i1> [[TMP7]], <4 x i32> zeroinitializer, <4 x i32> splat (i32 2)

`

``

1254

`+

; CHECK-NEXT: [[TMP12:%.*]] = select <4 x i1> [[TMP8]], <4 x i32> zeroinitializer, <4 x i32> splat (i32 2)

`

``

1255

`+

; CHECK-NEXT: [[TMP13:%.*]] = select <4 x i1> [[TMP9]], <4 x i32> zeroinitializer, <4 x i32> splat (i32 2)

`

``

1256

`+

; CHECK-NEXT: [[TMP14:%.*]] = select <4 x i1> [[TMP10]], <4 x i32> zeroinitializer, <4 x i32> splat (i32 2)

`

``

1257

`+

; CHECK-NEXT: [[TMP15]] = or <4 x i32> [[TMP11]], [[VEC_PHI]]

`

``

1258

`+

; CHECK-NEXT: [[TMP16]] = or <4 x i32> [[TMP12]], [[VEC_PHI2]]

`

``

1259

`+

; CHECK-NEXT: [[TMP17]] = or <4 x i32> [[TMP13]], [[VEC_PHI3]]

`

``

1260

`+

; CHECK-NEXT: [[TMP18]] = or <4 x i32> [[TMP14]], [[VEC_PHI4]]

`

``

1261

`+

; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 16

`

``

1262

`+

; CHECK-NEXT: [[VEC_IND_NEXT]] = add <4 x i32> [[STEP_ADD_3]], splat (i32 4)

`

``

1263

`+

; CHECK-NEXT: [[TMP19:%.*]] = icmp eq i32 [[INDEX_NEXT]], [[N_VEC]]

`

``

1264

`+

; CHECK-NEXT: br i1 [[TMP19]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop [[LOOP30:![0-9]+]]

`

``

1265

`+

; CHECK: middle.block:

`

``

1266

`+

; CHECK-NEXT: [[BIN_RDX:%.*]] = or <4 x i32> [[TMP16]], [[TMP15]]

`

``

1267

`+

; CHECK-NEXT: [[BIN_RDX5:%.*]] = or <4 x i32> [[TMP17]], [[BIN_RDX]]

`

``

1268

`+

; CHECK-NEXT: [[BIN_RDX6:%.*]] = or <4 x i32> [[TMP18]], [[BIN_RDX5]]

`

``

1269

`+

; CHECK-NEXT: [[TMP20:%.*]] = call i32 @llvm.vector.reduce.or.v4i32(<4 x i32> [[BIN_RDX6]])

`

``

1270

`+

; CHECK-NEXT: [[CMP_N:%.*]] = icmp eq i32 [[TMP1]], [[N_VEC]]

`

``

1271

`+

; CHECK-NEXT: br i1 [[CMP_N]], label [[EXIT:%.]], label [[VEC_EPILOG_ITER_CHECK:%.]]

`

``

1272

`+

; CHECK: vec.epilog.iter.check:

`

``

1273

`+

; CHECK-NEXT: [[N_VEC_REMAINING:%.*]] = sub i32 [[TMP1]], [[N_VEC]]

`

``

1274

`+

; CHECK-NEXT: [[MIN_EPILOG_ITERS_CHECK:%.*]] = icmp ult i32 [[N_VEC_REMAINING]], 4

`

``

1275

`+

; CHECK-NEXT: br i1 [[MIN_EPILOG_ITERS_CHECK]], label [[VEC_EPILOG_SCALAR_PH]], label [[VEC_EPILOG_PH]]

`

``

1276

`+

; CHECK: vec.epilog.ph:

`

``

1277

`+

; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i32 [ [[N_VEC]], [[VEC_EPILOG_ITER_CHECK]] ], [ 0, [[VECTOR_MAIN_LOOP_ITER_CHECK]] ]

`

``

1278

`+

; CHECK-NEXT: [[BC_MERGE_RDX:%.*]] = phi i32 [ [[TMP20]], [[VEC_EPILOG_ITER_CHECK]] ], [ 0, [[VECTOR_MAIN_LOOP_ITER_CHECK]] ]

`

``

1279

`+

; CHECK-NEXT: [[N_MOD_VF7:%.*]] = urem i32 [[TMP1]], 4

`

``

1280

`+

; CHECK-NEXT: [[N_VEC8:%.*]] = sub i32 [[TMP1]], [[N_MOD_VF7]]

`

``

1281

`+

; CHECK-NEXT: [[DOTSPLATINSERT:%.*]] = insertelement <4 x i32> poison, i32 [[BC_RESUME_VAL]], i64 0

`

``

1282

`+

; CHECK-NEXT: [[DOTSPLAT:%.*]] = shufflevector <4 x i32> [[DOTSPLATINSERT]], <4 x i32> poison, <4 x i32> zeroinitializer

`

``

1283

`+

; CHECK-NEXT: [[INDUCTION:%.*]] = add <4 x i32> [[DOTSPLAT]], <i32 0, i32 1, i32 2, i32 3>

`

``

1284

`+

; CHECK-NEXT: [[TMP21:%.*]] = insertelement <4 x i32> zeroinitializer, i32 [[BC_MERGE_RDX]], i32 0

`

``

1285

`+

; CHECK-NEXT: [[BROADCAST_SPLATINSERT13:%.*]] = insertelement <4 x i64> poison, i64 [[N]], i64 0

`

``

1286

`+

; CHECK-NEXT: [[BROADCAST_SPLAT14:%.*]] = shufflevector <4 x i64> [[BROADCAST_SPLATINSERT13]], <4 x i64> poison, <4 x i32> zeroinitializer

`

``

1287

`+

; CHECK-NEXT: br label [[VEC_EPILOG_VECTOR_BODY:%.*]]

`

``

1288

`+

; CHECK: vec.epilog.vector.body:

`

``

1289

`+

; CHECK-NEXT: [[INDEX9:%.]] = phi i32 [ [[BC_RESUME_VAL]], [[VEC_EPILOG_PH]] ], [ [[INDEX_NEXT15:%.]], [[VEC_EPILOG_VECTOR_BODY]] ]

`

``

1290

`+

; CHECK-NEXT: [[VEC_IND10:%.]] = phi <4 x i32> [ [[INDUCTION]], [[VEC_EPILOG_PH]] ], [ [[VEC_IND_NEXT11:%.]], [[VEC_EPILOG_VECTOR_BODY]] ]

`

``

1291

`+

; CHECK-NEXT: [[VEC_PHI12:%.]] = phi <4 x i32> [ [[TMP21]], [[VEC_EPILOG_PH]] ], [ [[TMP25:%.]], [[VEC_EPILOG_VECTOR_BODY]] ]

`

``

1292

`+

; CHECK-NEXT: [[TMP22:%.*]] = zext <4 x i32> [[VEC_IND10]] to <4 x i64>

`

``

1293

`+

; CHECK-NEXT: [[TMP23:%.*]] = icmp eq <4 x i64> [[BROADCAST_SPLAT14]], [[TMP22]]

`

``

1294

`+

; CHECK-NEXT: [[TMP24:%.*]] = select <4 x i1> [[TMP23]], <4 x i32> zeroinitializer, <4 x i32> splat (i32 2)

`

``

1295

`+

; CHECK-NEXT: [[TMP25]] = or <4 x i32> [[TMP24]], [[VEC_PHI12]]

`

``

1296

`+

; CHECK-NEXT: [[INDEX_NEXT15]] = add nuw i32 [[INDEX9]], 4

`

``

1297

`+

; CHECK-NEXT: [[VEC_IND_NEXT11]] = add <4 x i32> [[VEC_IND10]], splat (i32 4)

`

``

1298

`+

; CHECK-NEXT: [[TMP26:%.*]] = icmp eq i32 [[INDEX_NEXT15]], [[N_VEC8]]

`

``

1299

`+

; CHECK-NEXT: br i1 [[TMP26]], label [[VEC_EPILOG_MIDDLE_BLOCK:%.*]], label [[VEC_EPILOG_VECTOR_BODY]], !llvm.loop [[LOOP31:![0-9]+]]

`

``

1300

`+

; CHECK: vec.epilog.middle.block:

`

``

1301

`+

; CHECK-NEXT: [[TMP27:%.*]] = call i32 @llvm.vector.reduce.or.v4i32(<4 x i32> [[TMP25]])

`

``

1302

`+

; CHECK-NEXT: [[CMP_N16:%.*]] = icmp eq i32 [[TMP1]], [[N_VEC8]]

`

``

1303

`+

; CHECK-NEXT: br i1 [[CMP_N16]], label [[EXIT]], label [[VEC_EPILOG_SCALAR_PH]]

`

``

1304

`+

; CHECK: vec.epilog.scalar.ph:

`

``

1305

`+

; CHECK-NEXT: [[BC_RESUME_VAL17:%.]] = phi i32 [ [[N_VEC8]], [[VEC_EPILOG_MIDDLE_BLOCK]] ], [ 0, [[VECTOR_SCEVCHECK]] ], [ 0, [[ITER_CHECK:%.]] ], [ [[N_VEC]], [[VEC_EPILOG_ITER_CHECK]] ]

`

``

1306

`+

; CHECK-NEXT: [[BC_MERGE_RDX18:%.*]] = phi i32 [ [[TMP27]], [[VEC_EPILOG_MIDDLE_BLOCK]] ], [ 0, [[VECTOR_SCEVCHECK]] ], [ 0, [[ITER_CHECK]] ], [ [[TMP20]], [[VEC_EPILOG_ITER_CHECK]] ]

`

``

1307

`+

; CHECK-NEXT: br label [[LOOP:%.*]]

`

``

1308

`+

; CHECK: loop:

`

``

1309

`+

; CHECK-NEXT: [[IV:%.]] = phi i32 [ [[BC_RESUME_VAL17]], [[VEC_EPILOG_SCALAR_PH]] ], [ [[IV_NEXT:%.]], [[LOOP]] ]

`

``

1310

`+

; CHECK-NEXT: [[SELECT:%.]] = phi i32 [ [[BC_MERGE_RDX18]], [[VEC_EPILOG_SCALAR_PH]] ], [ [[SELECT_NEXT:%.]], [[LOOP]] ]

`

``

1311

`+

; CHECK-NEXT: [[IV_WIDEN:%.*]] = zext i32 [[IV]] to i64

`

``

1312

`+

; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i64 [[N]], [[IV_WIDEN]]

`

``

1313

`+

; CHECK-NEXT: [[SELECT_I:%.*]] = select i1 [[EXITCOND]], i32 0, i32 2

`

``

1314

`+

; CHECK-NEXT: [[SELECT_NEXT]] = or i32 [[SELECT_I]], [[SELECT]]

`

``

1315

`+

; CHECK-NEXT: [[IV_NEXT]] = add i32 [[IV]], 1

`

``

1316

`+

; CHECK-NEXT: br i1 [[EXITCOND]], label [[EXIT]], label [[LOOP]], !llvm.loop [[LOOP32:![0-9]+]]

`

``

1317

`+

; CHECK: exit:

`

``

1318

`+

; CHECK-NEXT: [[SELECT_NEXT_LCSSA:%.*]] = phi i32 [ [[SELECT_NEXT]], [[LOOP]] ], [ [[TMP20]], [[MIDDLE_BLOCK]] ], [ [[TMP27]], [[VEC_EPILOG_MIDDLE_BLOCK]] ]

`

``

1319

`+

; CHECK-NEXT: ret i32 [[SELECT_NEXT_LCSSA]]

`

``

1320

`+

;

`

``

1321

`+

entry:

`

``

1322

`+

br label %loop

`

``

1323

+

``

1324

`+

loop:

`

``

1325

`+

%iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]

`

``

1326

`+

%select = phi i32 [ 0, %entry ], [ %select.next, %loop ]

`

``

1327

`+

%iv.widen = zext i32 %iv to i64

`

``

1328

`+

%exitcond = icmp eq i64 %n, %iv.widen

`

``

1329

`+

%select.i = select i1 %exitcond, i32 0, i32 2

`

``

1330

`+

%select.next = or i32 %select.i, %select

`

``

1331

`+

%iv.next = add i32 %iv, 1

`

``

1332

`+

br i1 %exitcond, label %exit, label %loop

`

``

1333

+

``

1334

`+

exit:

`

``

1335

`+

ret i32 %select.next

`

``

1336

`+

}

`

``

1337

+

1214

1338

`declare void @llvm.assume(i1 noundef) #0

`

1215

1339

``

1216

1340

`attributes #0 = { "target-cpu"="penryn" }

`