@@ -1220,6 +1220,7 @@ template <bool need_check> static __global__ void
1220
1220
load_tiles_q4_0<arch_config.y , arch_config.nwarps , need_check>, VDR_Q4_0_Q8_1_MMQ, vec_dot_q4_0_q8_1_mul_mat>
1221
1221
(vx, vy, dst, ncols_x, nrows_x, ncols_y, nrows_y, nrows_dst);
1222
1222
#else
1223
+ GGML_UNUSED (get_arch_config_device);
1223
1224
GGML_UNUSED (vec_dot_q4_0_q8_1_mul_mat);
1224
1225
NO_DEVICE_CODE;
1225
1226
#endif // __CUDA_ARCH__ >= MIN_CC_DP4A
@@ -1244,6 +1245,7 @@ template <bool need_check> static __global__ void
1244
1245
load_tiles_q4_1<arch_config.y , arch_config.nwarps , need_check>, VDR_Q4_1_Q8_1_MMQ, vec_dot_q4_1_q8_1_mul_mat>
1245
1246
(vx, vy, dst, ncols_x, nrows_x, ncols_y, nrows_y, nrows_dst);
1246
1247
#else
1248
+ GGML_UNUSED (get_arch_config_device);
1247
1249
GGML_UNUSED (vec_dot_q4_1_q8_1_mul_mat);
1248
1250
NO_DEVICE_CODE;
1249
1251
#endif // __CUDA_ARCH__ >= MIN_CC_DP4A
@@ -1266,6 +1268,7 @@ template <bool need_check> static __global__ void
1266
1268
load_tiles_q5_0<arch_config.y , arch_config.nwarps , need_check>, VDR_Q5_0_Q8_1_MMQ, vec_dot_q5_0_q8_1_mul_mat>
1267
1269
(vx, vy, dst, ncols_x, nrows_x, ncols_y, nrows_y, nrows_dst);
1268
1270
#else
1271
+ GGML_UNUSED (get_arch_config_device);
1269
1272
GGML_UNUSED (vec_dot_q5_0_q8_1_mul_mat);
1270
1273
NO_DEVICE_CODE;
1271
1274
#endif // __CUDA_ARCH__ >= MIN_CC_DP4A
@@ -1288,6 +1291,7 @@ mul_mat_q5_1(
1288
1291
load_tiles_q5_1<arch_config.y , arch_config.nwarps , need_check>, VDR_Q5_1_Q8_1_MMQ, vec_dot_q5_1_q8_1_mul_mat>
1289
1292
(vx, vy, dst, ncols_x, nrows_x, ncols_y, nrows_y, nrows_dst);
1290
1293
#else
1294
+ GGML_UNUSED (get_arch_config_device);
1291
1295
GGML_UNUSED (vec_dot_q5_1_q8_1_mul_mat);
1292
1296
NO_DEVICE_CODE;
1293
1297
#endif // __CUDA_ARCH__ >= MIN_CC_DP4A
@@ -1310,6 +1314,7 @@ template <bool need_check> static __global__ void
1310
1314
load_tiles_q8_0<arch_config.y , arch_config.nwarps , need_check>, VDR_Q8_0_Q8_1_MMQ, vec_dot_q8_0_q8_1_mul_mat>
1311
1315
(vx, vy, dst, ncols_x, nrows_x, ncols_y, nrows_y, nrows_dst);
1312
1316
#else
1317
+ GGML_UNUSED (get_arch_config_device);
1313
1318
GGML_UNUSED (vec_dot_q8_0_q8_1_mul_mat);
1314
1319
NO_DEVICE_CODE;
1315
1320
#endif // __CUDA_ARCH__ >= MIN_CC_DP4A
@@ -1332,6 +1337,7 @@ mul_mat_q2_K(
1332
1337
load_tiles_q2_K<arch_config.y , arch_config.nwarps , need_check>, VDR_Q2_K_Q8_1_MMQ, vec_dot_q2_K_q8_1_mul_mat>
1333
1338
(vx, vy, dst, ncols_x, nrows_x, ncols_y, nrows_y, nrows_dst);
1334
1339
#else
1340
+ GGML_UNUSED (get_arch_config_device);
1335
1341
GGML_UNUSED (vec_dot_q2_K_q8_1_mul_mat);
1336
1342
NO_DEVICE_CODE;
1337
1343
#endif // __CUDA_ARCH__ >= MIN_CC_DP4A
@@ -1356,6 +1362,7 @@ template <bool need_check> static __global__ void
1356
1362
load_tiles_q3_K<arch_config.y , arch_config.nwarps , need_check>, VDR_Q3_K_Q8_1_MMQ, vec_dot_q3_K_q8_1_mul_mat>
1357
1363
(vx, vy, dst, ncols_x, nrows_x, ncols_y, nrows_y, nrows_dst);
1358
1364
#else
1365
+ GGML_UNUSED (get_arch_config_device);
1359
1366
GGML_UNUSED (vec_dot_q3_K_q8_1_mul_mat);
1360
1367
NO_DEVICE_CODE;
1361
1368
#endif // __CUDA_ARCH__ >= MIN_CC_DP4A
@@ -1380,6 +1387,7 @@ template <bool need_check> static __global__ void
1380
1387
load_tiles_q4_K<arch_config.y , arch_config.nwarps , need_check>, VDR_Q4_K_Q8_1_MMQ, vec_dot_q4_K_q8_1_mul_mat>
1381
1388
(vx, vy, dst, ncols_x, nrows_x, ncols_y, nrows_y, nrows_dst);
1382
1389
#else
1390
+ GGML_UNUSED (get_arch_config_device);
1383
1391
GGML_UNUSED (vec_dot_q4_K_q8_1_mul_mat);
1384
1392
NO_DEVICE_CODE;
1385
1393
#endif // __CUDA_ARCH__ >= MIN_CC_DP4A
@@ -1402,6 +1410,7 @@ mul_mat_q5_K(
1402
1410
load_tiles_q5_K<arch_config.y , arch_config.nwarps , need_check>, VDR_Q5_K_Q8_1_MMQ, vec_dot_q5_K_q8_1_mul_mat>
1403
1411
(vx, vy, dst, ncols_x, nrows_x, ncols_y, nrows_y, nrows_dst);
1404
1412
#else
1413
+ GGML_UNUSED (get_arch_config_device);
1405
1414
GGML_UNUSED (vec_dot_q5_K_q8_1_mul_mat);
1406
1415
NO_DEVICE_CODE;
1407
1416
#endif // __CUDA_ARCH__ >= MIN_CC_DP4A
@@ -1426,6 +1435,7 @@ template <bool need_check> static __global__ void
1426
1435
load_tiles_q6_K<arch_config.y , arch_config.nwarps , need_check>, VDR_Q6_K_Q8_1_MMQ, vec_dot_q6_K_q8_1_mul_mat>
1427
1436
(vx, vy, dst, ncols_x, nrows_x, ncols_y, nrows_y, nrows_dst);
1428
1437
#else
1438
+ GGML_UNUSED (get_arch_config_device);
1429
1439
GGML_UNUSED (vec_dot_q6_K_q8_1_mul_mat);
1430
1440
NO_DEVICE_CODE;
1431
1441
#endif // __CUDA_ARCH__ >= MIN_CC_DP4A
0 commit comments