Skip to content

Commit 9f5cc09

Browse files
Update gfx1150 GEMM and CONV quick-tune lists.
1 parent ef97d77 commit 9f5cc09

File tree

1 file changed

+238
-0
lines changed

1 file changed

+238
-0
lines changed

mlir/include/mlir/Dialect/Rock/Tuning/QuickTuningPerfconfigs.inc

Lines changed: 238 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -207,6 +207,71 @@ const InitParamsNonAccel PopulateParams::initParametersConvGfx1151[PopulateParam
207207
};
208208
// END_CONV_NonAccel_f32_gfx1151_DEFS
209209

210+
// Quick-tune perf-config table for gfx1150 f32 GEMM on the non-accelerated
// path (see the GEMM_NonAccel_f32_gfx1150 markers). Defines the static member
// PopulateParams::initParametersGemmGfx1150: 13 InitParamsNonAccel entries of
// 9 initializers each. The array bound nInitParametersGemmGfx1150 is declared
// separately, so keep that count in sync with the number of rows listed here.
// The NonAccel lookup table refers to this array under "gfx1150_gemm_f32".
// NOTE(review): the meaning and order of the 9 fields come from
// InitParamsNonAccel, which is not visible in this section - confirm against
// the struct before hand-editing a row.
// NOTE(review): the BEGIN/END markers suggest this section is maintained by a
// script - verify before editing by hand.
// BEGIN_GEMM_NonAccel_f32_gfx1150_DEFS
211+
const InitParamsNonAccel PopulateParams::initParametersGemmGfx1150[PopulateParams::nInitParametersGemmGfx1150] = {
212+
{64,64,128,4,2,2,1,1,2},
213+
{128,128,128,16,4,2,1,1,2},
214+
{64,64,128,16,2,2,1,1,2},
215+
{64,128,64,16,2,2,1,1,2},
216+
{64,64,64,8,2,2,1,1,2},
217+
{64,128,32,16,2,4,1,1,2},
218+
{256,128,128,8,4,4,1,1,2},
219+
{128,32,32,16,2,4,1,1,2},
220+
{64,32,64,8,4,4,1,1,2},
221+
{128,64,128,4,2,2,1,1,2},
222+
{256,64,128,16,4,4,1,1,2},
223+
{128,64,64,4,4,2,1,1,2},
224+
{64,32,32,16,4,2,1,1,2}
225+
};
226+
// END_GEMM_NonAccel_f32_gfx1150_DEFS
227+
228+
// Quick-tune perf-config table for gfx1150 f32 convolution on the
// non-accelerated path (see the CONV_NonAccel_f32_gfx1150 markers). Defines
// the static member PopulateParams::initParametersConvGfx1150: 42
// InitParamsNonAccel entries of 9 initializers each. The array bound
// nInitParametersConvGfx1150 is declared separately, so keep that count in
// sync with the number of rows listed here.
// The NonAccel lookup table refers to this array under "gfx1150_conv_f32".
// NOTE(review): the meaning and order of the 9 fields come from
// InitParamsNonAccel, which is not visible in this section - confirm against
// the struct before hand-editing a row.
// NOTE(review): the BEGIN/END markers suggest this section is maintained by a
// script - verify before editing by hand.
// BEGIN_CONV_NonAccel_f32_gfx1150_DEFS
229+
const InitParamsNonAccel PopulateParams::initParametersConvGfx1150[PopulateParams::nInitParametersConvGfx1150] = {
230+
{64,64,128,16,2,2,1,1,2},
231+
{64,64,128,8,2,2,1,1,2},
232+
{64,64,128,4,2,2,1,1,2},
233+
{64,64,128,4,2,4,1,1,2},
234+
{64,64,128,16,4,2,1,1,2},
235+
{64,64,128,8,2,4,1,1,2},
236+
{64,128,64,16,2,2,1,1,2},
237+
{64,64,128,16,4,4,1,1,2},
238+
{64,64,128,4,4,2,1,1,2},
239+
{128,128,128,16,2,4,1,1,2},
240+
{128,128,128,16,4,2,1,1,2},
241+
{64,64,64,4,2,4,1,1,2},
242+
{64,32,128,4,2,2,1,1,2},
243+
{64,64,64,8,4,2,1,1,2},
244+
{64,64,64,16,2,2,1,1,2},
245+
{128,128,128,4,2,2,1,1,2},
246+
{64,128,64,16,4,2,1,1,2},
247+
{128,128,128,4,2,4,1,1,2},
248+
{64,32,64,4,2,2,1,1,2},
249+
{64,64,32,16,2,2,1,1,2},
250+
{64,32,64,16,2,2,1,1,2},
251+
{128,128,64,8,4,2,1,1,2},
252+
{64,128,64,4,4,4,1,1,2},
253+
{256,128,128,8,2,2,1,1,2},
254+
{64,128,32,16,4,2,1,1,2},
255+
{64,64,32,8,2,4,1,1,2},
256+
{128,32,32,16,2,4,1,1,2},
257+
{128,64,64,16,2,4,1,1,2},
258+
{128,64,32,16,2,2,1,1,2},
259+
{64,32,32,8,2,2,1,1,2},
260+
{64,128,32,8,4,2,1,1,2},
261+
{256,128,128,4,2,4,1,1,2},
262+
{128,128,32,16,2,4,1,1,2},
263+
{256,128,128,16,4,2,1,1,2},
264+
{64,128,32,8,2,4,1,1,2},
265+
{128,64,64,16,4,2,1,1,2},
266+
{256,64,64,16,2,4,1,1,2},
267+
{128,64,64,8,4,4,1,1,2},
268+
{256,32,128,8,2,2,1,1,2},
269+
{256,32,64,8,2,2,1,1,2},
270+
{256,64,32,16,2,2,1,1,2},
271+
{128,64,32,4,2,2,1,1,2}
272+
};
273+
// END_CONV_NonAccel_f32_gfx1150_DEFS
274+
210275
#endif
211276

212277
#ifdef NonAccel_DECLARATIONS_GEN
@@ -251,6 +316,16 @@ static constexpr size_t nInitParametersConvGfx1151 = 34;
251316
static const InitParamsNonAccel initParametersConvGfx1151[nInitParametersConvGfx1151];
252317
// END_CONV_NonAccel_f32_gfx1151_DECS
253318

319+
// Entry count and static member declaration for the gfx1150 f32 GEMM
// non-accel quick-tune table. The out-of-class definition of
// PopulateParams::initParametersGemmGfx1150 uses this constant as its array
// bound, so it must be kept in sync with the number of rows listed there.
// BEGIN_GEMM_NonAccel_f32_gfx1150_DECS
320+
static constexpr size_t nInitParametersGemmGfx1150 = 13;
321+
static const InitParamsNonAccel initParametersGemmGfx1150[nInitParametersGemmGfx1150];
322+
// END_GEMM_NonAccel_f32_gfx1150_DECS
323+
324+
// Entry count and static member declaration for the gfx1150 f32 convolution
// non-accel quick-tune table. The out-of-class definition of
// PopulateParams::initParametersConvGfx1150 uses this constant as its array
// bound, so it must be kept in sync with the number of rows listed there.
// BEGIN_CONV_NonAccel_f32_gfx1150_DECS
325+
static constexpr size_t nInitParametersConvGfx1150 = 42;
326+
static const InitParamsNonAccel initParametersConvGfx1150[nInitParametersConvGfx1150];
327+
// END_CONV_NonAccel_f32_gfx1150_DECS
328+
254329
#endif
255330

256331
#ifdef XDL_DEFINITIONS_GEN
@@ -1382,6 +1457,143 @@ const InitParamsAccel PopulateParamsWmma::initParametersForwardI8ConvGfx1151[Pop
13821457
};
13831458
// END_CONV_Wmma_i8_gfx1151_DEFS
13841459

1460+
// Quick-tune perf-config table for gfx1150 f16 GEMM on the WMMA path (see the
// GEMM_Wmma_f16_gfx1150 markers). Defines the static member
// PopulateParamsWmma::initParametersFp16GemmGfx1150: 21 InitParamsAccel
// entries of 11 initializers each (nine integers followed by two booleans,
// both `true` in every row here). The array bound
// nInitParametersFp16GemmGfx1150 is declared separately, so keep that count in
// sync with the number of rows listed here.
// A lookup-table row keyed "gfx1150_gemm_f16" refers to this array.
// NOTE(review): the meaning and order of the fields come from InitParamsAccel,
// which is not visible in this section - confirm against the struct before
// hand-editing a row.
// NOTE(review): the BEGIN/END markers suggest this section is maintained by a
// script - verify before editing by hand.
// BEGIN_GEMM_Wmma_f16_gfx1150_DEFS
1461+
const InitParamsAccel PopulateParamsWmma::initParametersFp16GemmGfx1150[PopulateParamsWmma::nInitParametersFp16GemmGfx1150] = {
1462+
{64,128,8,32,64,8,1,1,2,true,true},
1463+
{128,256,8,64,64,8,1,1,2,true,true},
1464+
{128,256,4,128,32,8,1,1,2,true,true},
1465+
{64,128,4,32,64,8,1,1,2,true,true},
1466+
{64,64,4,64,64,8,1,1,2,true,true},
1467+
{64,256,8,16,128,8,1,1,2,true,true},
1468+
{16,16,8,16,16,16,1,2,2,true,true},
1469+
{16,16,8,16,16,8,1,2,2,true,true},
1470+
{128,64,8,32,32,8,1,1,2,true,true},
1471+
{128,256,2,128,32,8,1,1,2,true,true},
1472+
{64,64,8,32,64,8,1,1,2,true,true},
1473+
{32,16,8,16,16,16,1,2,2,true,true},
1474+
{32,32,8,16,16,8,1,2,2,true,true},
1475+
{256,128,4,128,64,4,1,1,2,true,true},
1476+
{32,64,4,32,64,16,1,1,2,true,true},
1477+
{256,128,4,64,64,16,1,1,2,true,true},
1478+
{16,16,4,16,16,4,1,2,2,true,true},
1479+
{128,64,4,32,32,4,1,1,2,true,true},
1480+
{64,32,4,16,32,4,1,1,2,true,true},
1481+
{128,128,8,64,32,16,1,1,2,true,true},
1482+
{256,64,8,128,32,8,1,1,2,true,true}
1483+
};
1484+
// END_GEMM_Wmma_f16_gfx1150_DEFS
1485+
1486+
// Quick-tune perf-config table for gfx1150 i8 GEMM on the WMMA path (see the
// GEMM_Wmma_i8_gfx1150 markers). Defines the static member
// PopulateParamsWmma::initParametersI8GemmGfx1150: 16 InitParamsAccel entries
// of 11 initializers each (nine integers followed by two booleans, both `true`
// in every row here). The array bound nInitParametersI8GemmGfx1150 is declared
// separately, so keep that count in sync with the number of rows listed here.
// A lookup-table row keyed "gfx1150_gemm_i8" refers to this array.
// NOTE(review): the meaning and order of the fields come from InitParamsAccel,
// which is not visible in this section - confirm against the struct before
// hand-editing a row.
// NOTE(review): the BEGIN/END markers suggest this section is maintained by a
// script - verify before editing by hand.
// BEGIN_GEMM_Wmma_i8_gfx1150_DEFS
1487+
const InitParamsAccel PopulateParamsWmma::initParametersI8GemmGfx1150[PopulateParamsWmma::nInitParametersI8GemmGfx1150] = {
1488+
{128,256,4,128,32,16,1,1,2,true,true},
1489+
{128,64,2,64,32,16,1,2,2,true,true},
1490+
{16,16,8,16,16,16,1,2,2,true,true},
1491+
{128,64,8,128,16,16,1,1,2,true,true},
1492+
{128,128,4,128,32,16,1,1,2,true,true},
1493+
{32,256,2,32,64,16,1,1,2,true,true},
1494+
{32,64,4,32,16,16,1,2,2,true,true},
1495+
{64,128,2,64,32,16,1,2,2,true,true},
1496+
{256,256,4,128,32,16,1,1,2,true,true},
1497+
{32,64,8,16,64,16,1,1,2,true,true},
1498+
{128,128,8,32,64,16,1,1,2,true,true},
1499+
{64,256,8,16,128,16,1,1,2,true,true},
1500+
{64,64,4,64,64,16,1,1,2,true,true},
1501+
{256,32,4,128,16,16,1,1,2,true,true},
1502+
{16,16,4,16,16,4,1,2,2,true,true},
1503+
{256,64,4,128,16,16,1,1,2,true,true}
1504+
};
1505+
// END_GEMM_Wmma_i8_gfx1150_DEFS
1506+
1507+
// Quick-tune perf-config table for gfx1150 f16 convolution on the WMMA path
// (see the CONV_Wmma_f16_gfx1150 markers). Defines the static member
// PopulateParamsWmma::initParametersFp16ConvGfx1150: 59 InitParamsAccel
// entries of 11 initializers each (nine integers followed by two booleans,
// both `true` in every row here). The array bound
// nInitParametersFp16ConvGfx1150 is declared separately, so keep that count in
// sync with the number of rows listed here.
// A lookup-table row keyed "gfx1150_conv_f16" refers to this array.
// NOTE(review): the meaning and order of the fields come from InitParamsAccel,
// which is not visible in this section - confirm against the struct before
// hand-editing a row.
// NOTE(review): the BEGIN/END markers suggest this section is maintained by a
// script - verify before editing by hand.
// BEGIN_CONV_Wmma_f16_gfx1150_DEFS
1507+
const InitParamsAccel PopulateParamsWmma::initParametersFp16ConvGfx1150[PopulateParamsWmma::nInitParametersFp16ConvGfx1150] = {
1508+
{64,128,4,64,32,8,1,1,2,true,true},
1509+
{128,64,8,128,16,8,1,1,2,true,true},
1510+
{128,64,4,64,32,8,1,1,2,true,true},
1511+
{64,256,2,64,64,8,1,1,2,true,true},
1512+
{128,128,4,128,32,8,1,1,2,true,true},
1513+
{128,128,8,16,128,8,1,1,2,true,true},
1514+
{64,256,4,64,32,8,1,1,2,true,true},
1515+
{128,64,8,32,32,8,1,1,2,true,true},
1516+
{32,64,4,32,64,4,1,1,2,true,true},
1517+
{128,256,4,128,32,8,1,1,2,true,true},
1518+
{128,128,2,128,32,16,1,1,2,true,true},
1519+
{256,128,8,128,32,8,1,1,2,true,true},
1520+
{128,64,2,128,32,8,1,1,2,true,true},
1521+
{256,256,8,128,32,8,1,1,2,true,true},
1522+
{64,128,8,64,32,8,1,1,2,true,true},
1523+
{64,128,8,64,16,8,1,1,2,true,true},
1524+
{32,128,4,32,64,8,1,1,2,true,true},
1525+
{128,128,8,32,64,8,1,1,2,true,true},
1526+
{256,128,8,64,32,8,1,1,2,true,true},
1527+
{32,128,2,32,128,8,1,1,2,true,true},
1528+
{64,128,2,64,32,8,1,2,2,true,true},
1529+
{256,64,4,64,64,8,1,1,2,true,true},
1530+
{64,128,4,64,16,8,1,2,2,true,true},
1531+
{32,128,2,32,32,8,1,2,2,true,true},
1532+
{128,64,4,128,32,4,1,1,2,true,true},
1533+
{64,256,4,64,16,8,1,2,2,true,true},
1534+
{256,128,8,64,64,8,1,1,2,true,true},
1535+
{64,32,4,32,32,8,1,1,2,true,true},
1536+
{16,128,4,16,128,8,1,1,2,true,true},
1537+
{32,256,2,32,128,8,1,1,2,true,true},
1538+
{128,64,2,32,32,8,1,1,2,true,true},
1539+
{256,64,8,64,32,8,1,1,2,true,true},
1540+
{32,32,4,32,16,8,1,2,2,true,true},
1541+
{256,64,2,32,64,8,1,1,2,true,true},
1542+
{64,64,8,16,64,8,1,2,2,true,true},
1543+
{64,32,8,32,32,8,1,1,2,true,true},
1544+
{16,32,8,16,32,8,1,1,2,true,true},
1545+
{64,64,8,16,32,8,1,2,2,true,true},
1546+
{16,32,4,16,32,8,1,2,2,true,true},
1547+
{128,256,8,128,32,8,1,1,2,true,true},
1548+
{64,128,8,16,128,8,1,2,2,true,true},
1549+
{32,32,8,16,16,8,1,1,2,true,true},
1550+
{256,32,4,64,32,8,1,1,2,true,true},
1551+
{32,64,8,16,16,8,1,2,2,true,true},
1552+
{256,128,8,32,64,8,1,1,2,true,true},
1553+
{32,128,8,32,32,8,1,2,2,true,true},
1554+
{32,16,4,16,16,8,1,1,2,true,true},
1555+
{32,32,8,16,16,8,1,2,2,true,true},
1556+
{16,64,8,16,16,8,1,1,2,true,true},
1557+
{16,32,4,16,16,4,1,1,2,true,true},
1558+
{256,32,8,32,32,8,1,1,2,true,true},
1559+
{16,128,8,16,64,8,1,1,2,true,true},
1560+
{64,32,8,32,16,16,1,1,2,true,true},
1561+
{16,16,4,16,16,4,1,1,2,true,true},
1562+
{128,32,4,16,32,16,1,1,2,true,true},
1563+
{16,16,8,16,16,16,1,1,2,true,true},
1564+
{128,16,4,32,16,8,1,2,2,true,true},
1565+
{64,16,8,32,16,16,1,1,2,true,true},
1566+
{32,16,8,16,16,16,1,1,2,true,true}
1567+
};
1568+
// END_CONV_Wmma_f16_gfx1150_DEFS
1570+
1571+
// Quick-tune perf-config table for gfx1150 i8 convolution on the WMMA path
// (see the CONV_Wmma_i8_gfx1150 markers). Defines the static member
// PopulateParamsWmma::initParametersForwardI8ConvGfx1150: 21 InitParamsAccel
// entries of 11 initializers each (nine integers followed by two booleans,
// both `true` in every row here). The array bound
// nInitParametersForwardI8ConvGfx1150 is declared separately, so keep that
// count in sync with the number of rows listed here.
// A lookup-table row keyed "gfx1150_conv_i8" refers to this array.
// NOTE(review): the meaning and order of the fields come from InitParamsAccel,
// which is not visible in this section - confirm against the struct before
// hand-editing a row.
// NOTE(review): the BEGIN/END markers suggest this section is maintained by a
// script - verify before editing by hand.
// BEGIN_CONV_Wmma_i8_gfx1150_DEFS
1572+
const InitParamsAccel PopulateParamsWmma::initParametersForwardI8ConvGfx1150[PopulateParamsWmma::nInitParametersForwardI8ConvGfx1150] = {
1573+
{128,32,4,32,32,16,1,2,2,true,true},
1574+
{16,128,4,16,128,4,1,1,2,true,true},
1575+
{256,32,2,32,32,16,1,1,2,true,true},
1576+
{64,128,4,32,64,8,1,1,2,true,true},
1577+
{256,64,2,64,64,16,1,2,2,true,true},
1578+
{64,64,4,16,64,16,1,1,2,true,true},
1579+
{128,256,2,128,64,8,1,1,2,true,true},
1580+
{128,64,8,128,32,4,1,2,2,true,true},
1581+
{64,64,8,16,64,16,1,1,2,true,true},
1582+
{128,64,4,64,64,4,1,1,2,true,true},
1583+
{128,64,8,64,16,16,1,1,2,true,true},
1584+
{128,128,2,128,32,8,1,2,2,true,true},
1585+
{256,64,8,64,64,8,1,1,2,true,true},
1586+
{256,32,4,64,32,16,1,1,2,true,true},
1587+
{256,32,8,16,32,16,1,1,2,true,true},
1588+
{32,256,4,32,128,4,1,2,2,true,true},
1589+
{64,128,2,32,64,16,1,2,2,true,true},
1590+
{128,16,4,16,16,8,1,1,2,true,true},
1591+
{16,16,8,16,16,8,1,1,2,true,true},
1592+
{256,16,8,16,16,16,1,1,2,true,true},
1593+
{256,32,8,128,32,16,1,1,2,true,true}
1594+
};
1595+
// END_CONV_Wmma_i8_gfx1150_DEFS
1596+
13851597
#endif
13861598

13871599
#ifdef Wmma_DECLARATIONS_GEN
@@ -1476,6 +1688,26 @@ static constexpr size_t nInitParametersForwardI8ConvGfx1151 = 18;
14761688
static const InitParamsAccel initParametersForwardI8ConvGfx1151[nInitParametersForwardI8ConvGfx1151];
14771689
// END_CONV_Wmma_i8_gfx1151_DECS
14781690

1691+
// Entry count and static member declaration for the gfx1150 f16 GEMM WMMA
// quick-tune table. The out-of-class definition of
// PopulateParamsWmma::initParametersFp16GemmGfx1150 uses this constant as its
// array bound, so it must be kept in sync with the number of rows listed there.
// BEGIN_GEMM_Wmma_f16_gfx1150_DECS
1692+
static constexpr size_t nInitParametersFp16GemmGfx1150 = 21;
1693+
static const InitParamsAccel initParametersFp16GemmGfx1150[nInitParametersFp16GemmGfx1150];
1694+
// END_GEMM_Wmma_f16_gfx1150_DECS
1695+
1696+
// Entry count and static member declaration for the gfx1150 i8 GEMM WMMA
// quick-tune table. The out-of-class definition of
// PopulateParamsWmma::initParametersI8GemmGfx1150 uses this constant as its
// array bound, so it must be kept in sync with the number of rows listed there.
// BEGIN_GEMM_Wmma_i8_gfx1150_DECS
1697+
static constexpr size_t nInitParametersI8GemmGfx1150 = 16;
1698+
static const InitParamsAccel initParametersI8GemmGfx1150[nInitParametersI8GemmGfx1150];
1699+
// END_GEMM_Wmma_i8_gfx1150_DECS
1700+
1701+
// Entry count and static member declaration for the gfx1150 f16 convolution
// WMMA quick-tune table. The out-of-class definition of
// PopulateParamsWmma::initParametersFp16ConvGfx1150 uses this constant as its
// array bound, so it must be kept in sync with the number of rows listed there.
// BEGIN_CONV_Wmma_f16_gfx1150_DECS
1702+
static constexpr size_t nInitParametersFp16ConvGfx1150 = 59;
1703+
static const InitParamsAccel initParametersFp16ConvGfx1150[nInitParametersFp16ConvGfx1150];
1704+
// END_CONV_Wmma_f16_gfx1150_DECS
1705+
1706+
// Entry count and static member declaration for the gfx1150 i8 convolution
// WMMA quick-tune table. The out-of-class definition of
// PopulateParamsWmma::initParametersForwardI8ConvGfx1150 uses this constant as
// its array bound, so it must be kept in sync with the number of rows listed
// there.
// BEGIN_CONV_Wmma_i8_gfx1150_DECS
1707+
static constexpr size_t nInitParametersForwardI8ConvGfx1150 = 21;
1708+
static const InitParamsAccel initParametersForwardI8ConvGfx1150[nInitParametersForwardI8ConvGfx1150];
1709+
// END_CONV_Wmma_i8_gfx1150_DECS
1710+
14791711
#endif
14801712

14811713
#ifdef NonAccel_LOOKUP_TABLE_GEN
@@ -1488,6 +1720,8 @@ static const InitParamsAccel initParametersForwardI8ConvGfx1151[nInitParametersF
14881720
{"gfx1201_conv_f32", {PopulateParams::initParametersConvGfx1201, PopulateParams::nInitParametersConvGfx1201}},
14891721
{"gfx1151_gemm_f32", {PopulateParams::initParametersGemmGfx1151, PopulateParams::nInitParametersGemmGfx1151}},
14901722
{"gfx1151_conv_f32", {PopulateParams::initParametersConvGfx1151, PopulateParams::nInitParametersConvGfx1151}},
1723+
{"gfx1150_gemm_f32", {PopulateParams::initParametersGemmGfx1150, PopulateParams::nInitParametersGemmGfx1150}},
1724+
{"gfx1150_conv_f32", {PopulateParams::initParametersConvGfx1150, PopulateParams::nInitParametersConvGfx1150}},
14911725

14921726
#endif
14931727

@@ -1537,5 +1771,9 @@ static const InitParamsAccel initParametersForwardI8ConvGfx1151[nInitParametersF
15371771
{"gfx1151_gemm_i8", {PopulateParamsWmma::initParametersI8GemmGfx1151, PopulateParamsWmma::nInitParametersI8GemmGfx1151}},
15381772
{"gfx1151_conv_f16", {PopulateParamsWmma::initParametersFp16ConvGfx1151, PopulateParamsWmma::nInitParametersFp16ConvGfx1151}},
15391773
{"gfx1151_conv_i8", {PopulateParamsWmma::initParametersForwardI8ConvGfx1151, PopulateParamsWmma::nInitParametersForwardI8ConvGfx1151}},
1774+
{"gfx1150_gemm_f16", {PopulateParamsWmma::initParametersFp16GemmGfx1150, PopulateParamsWmma::nInitParametersFp16GemmGfx1150}},
1775+
{"gfx1150_gemm_i8", {PopulateParamsWmma::initParametersI8GemmGfx1150, PopulateParamsWmma::nInitParametersI8GemmGfx1150}},
1776+
{"gfx1150_conv_f16", {PopulateParamsWmma::initParametersFp16ConvGfx1150, PopulateParamsWmma::nInitParametersFp16ConvGfx1150}},
1777+
{"gfx1150_conv_i8", {PopulateParamsWmma::initParametersForwardI8ConvGfx1150, PopulateParamsWmma::nInitParametersForwardI8ConvGfx1150}},
15401778

15411779
#endif

0 commit comments

Comments
 (0)