Skip to content
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion library/src/blas1/rocblas_dot_kernels.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -237,7 +237,7 @@ rocblas_dot_kernel_gfx942_gfx950_float_double(rocblas_int n,
V* __restrict__ workspace,
T* __restrict__ out)
{
-#if defined(__gfx942__) || defined(__gfx950__)
+#if defined(__gfx942__) || defined(__gfx950__) || defined(__gfx9_4_generic__)
int i = blockIdx.x * NB + threadIdx.x;
const auto* x = load_ptr_batch(xa, blockIdx.z, shiftx, stridex);
const auto* y = load_ptr_batch(ya, blockIdx.z, shifty, stridey);
Expand Down
2 changes: 1 addition & 1 deletion library/src/blas2/gemv_device.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -1385,7 +1385,7 @@ rocblas_gemvn_sm_mn_batched_kernel(rocblas_int m,
rocblas_stride stridey,
rocblas_int batch_count)
{
-#if defined(__gfx90a__) || defined(__gfx942__) || defined(__gfx950__)
+#if defined(__gfx90a__) || defined(__gfx942__) || defined(__gfx950__) || defined(__gfx9_4_generic__)

const int b = blockIdx.x * blockDim.y + threadIdx.y;
if(b >= batch_count)
Expand Down
2 changes: 1 addition & 1 deletion library/src/blas2/rocblas_ger_kernels.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -139,7 +139,7 @@ rocblas_sger_gfx942_gfx950_kernel(rocblas_int m,
int64_t lda,
rocblas_stride strideA)
{
-#if defined(__gfx942__) || defined(__gfx950__)
+#if defined(__gfx942__) || defined(__gfx950__) || defined(__gfx9_4_generic__)

rocblas_int tx = (blockIdx.x * DIM_X + threadIdx.x) * 2;
rocblas_int col = blockIdx.y;
Expand Down
2 changes: 1 addition & 1 deletion library/src/blas3/rocblas_dgmm_kernels.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -91,7 +91,7 @@ rocblas_dgmm_gfx942_gfx950_kernel(rocblas_int m,
int64_t ldc,
rocblas_stride stride_C)
{
-#if defined(__gfx942__) || defined(__gfx950__)
+#if defined(__gfx942__) || defined(__gfx950__) || defined(__gfx9_4_generic__)

rocblas_int tx = (blockIdx.x * DIM_X + threadIdx.x) * 2;
rocblas_int ty = blockIdx.y * DIM_Y + threadIdx.y;
Expand Down