Skip to content

Commit 76f3131

Browse files
author
Chao Liu
committed
tidy
1 parent d184289 commit 76f3131

File tree

6 files changed

+6
-15
lines changed

6 files changed

+6
-15
lines changed

CMakeLists.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -40,7 +40,7 @@ message(STATUS "Build with HIP ${hip_VERSION}")
4040

4141
## half
4242
#find_path(HALF_INCLUDE_DIR half.hpp)
43-
#message("HALF_INCLUDE_DIR: ${HALF_INCLUDE_DIR}")
43+
message("HALF_INCLUDE_DIR: ${HALF_INCLUDE_DIR}")
4444

4545
## tidy
4646
include(EnableCompilerWarnings)

composable_kernel/include/tensor_operation/gridwise_dynamic_gemm_xdlops_v2r3.hpp

Lines changed: 0 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -411,9 +411,6 @@ struct GridwiseDynamicGemm_k0mk1_k0nk1_mn_xdlops_v2r3
411411
constexpr auto a_block_space_size =
412412
math::integer_least_multiple(a_k0_m_k1_block_desc.GetElementSpaceSize(), max_lds_align);
413413

414-
constexpr auto b_block_space_size =
415-
math::integer_least_multiple(b_k0_n_k1_block_desc.GetElementSpaceSize(), max_lds_align);
416-
417414
FloatAB* p_a_block = p_shared_block;
418415
FloatAB* p_b_block = p_shared_block + a_block_space_size;
419416

@@ -574,8 +571,6 @@ struct GridwiseDynamicGemm_k0mk1_k0nk1_mn_xdlops_v2r3
574571
make_dynamic_naive_tensor_descriptor_packed_v2(make_tuple(
575572
I1, I1, I1, I1, Number<M0>{}, Number<1>{}, Number<M2>{}, Number<1>{}));
576573

577-
StaticBuffer<AddressSpaceEnum_t::Vgpr, FloatC, BlkSize> c_blk_buf_;
578-
579574
// calculate origin of thread output tensor on global memory
580575
// blockwise GEMM c matrix starting index
581576
const auto c_thread_mtx_on_block =

host/driver_offline/CMakeLists.txt

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,6 @@ include_directories(BEFORE
99
${PROJECT_SOURCE_DIR}/composable_kernel/include/problem_transform
1010
${PROJECT_SOURCE_DIR}/composable_kernel/include/driver
1111
${PROJECT_SOURCE_DIR}/external/rocm/include
12-
${PROJECT_SOURCE_DIR}/external/half/include
1312
)
1413

1514
set(CONV_FWD_DRIVER_OFFLINE_SOURCE src/conv_fwd_driver_offline.cpp)

host/driver_offline/include/device_dynamic_convolution_forward_implicit_gemm_v4r4r4_xdlops_nhwc_kyxc_nhwk.hpp

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -338,9 +338,6 @@ void device_dynamic_convolution_forward_implicit_gemm_v4r4r4_xdlops_nhwc_kyxc_nh
338338
const auto K = out_n_ho_wo_k_lengths[I3];
339339
const auto C = wei_k_y_x_c_lengths[I3];
340340

341-
const auto Hi = in_n_hi_wi_c_lengths[I1];
342-
const auto Wi = in_n_hi_wi_c_lengths[I2];
343-
344341
const auto Ho = out_n_ho_wo_k_lengths[I1];
345342
const auto Wo = out_n_ho_wo_k_lengths[I2];
346343

host/driver_offline/src/conv_fwd_driver_offline.cpp

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -20,11 +20,11 @@
2020
#include "device_dynamic_convolution_forward_implicit_gemm_v4r4r4_xdlops_nhwc_kyxc_nhwk.hpp"
2121

2222
#define USE_DYNAMIC_MODE 1
23-
#define USE_CONV_FWD_V4R4_NCHW 0
24-
#define USE_CONV_FWD_V4R4R2_NHWC 0
25-
#define USE_CONV_FWD_V6R1_NCHW 0
23+
#define USE_CONV_FWD_V4R4_NCHW 1
24+
#define USE_CONV_FWD_V4R4R2_NHWC 1
25+
#define USE_CONV_FWD_V6R1_NCHW 1
2626
#define USE_CONV_FWD_V5R1_NCHW 0
27-
#define USE_CONV_FWD_V4R4R2_XDL_NCHW 0
27+
#define USE_CONV_FWD_V4R4R2_XDL_NCHW 1
2828
#define USE_CONV_FWD_V4R4R4_XDL_NHWC 1
2929

3030
enum ConvForwardAlgo

host/host_tensor/CMakeLists.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@ set(HOST_TENSOR_SOURCE
1010
## the library target
1111
add_library(host_tensor SHARED ${HOST_TENSOR_SOURCE})
1212

13-
#target_include_directories(host_tensor SYSTEM PUBLIC $<BUILD_INTERFACE:${HALF_INCLUDE_DIR}>)
13+
target_include_directories(host_tensor SYSTEM PUBLIC $<BUILD_INTERFACE:${HALF_INCLUDE_DIR}>)
1414

1515
target_link_libraries(host_tensor PRIVATE hip::device)
1616
target_link_libraries(host_tensor INTERFACE hip::host)

0 commit comments

Comments
 (0)