Skip to content
2 changes: 2 additions & 0 deletions csrc/includes/custom_cuda_layers.h
100644 → 100755
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,8 @@
// Compile-time limits shared by the custom CUDA layers.
// NOTE(review): no use sites are visible in this hunk; the meanings noted
// below are inferred from the names only and should be confirmed against
// the kernels that consume these macros.

// presumably the cap on per-thread loop iterations — TODO confirm
#define MAX_THREAD_ITERATIONS 8 // Maximum 8K
// presumably the maximum number of warps per thread block — TODO confirm
#define MAX_WARP_NUM 32

// presumably an upper bound on per-thread register-resident values used to
// size local arrays in kernels — TODO confirm against the use sites
#define MAX_REGISTERS 256

// Fused bias add with gelu activation
template <typename T>
void launch_bias_gelu(const T* input,
Expand Down
3 changes: 2 additions & 1 deletion csrc/transformer/cublas_wrappers.cu
Original file line number Diff line number Diff line change
Expand Up @@ -133,7 +133,8 @@ int cublas_strided_batched_gemm(cublasHandle_t handle,

if (status != CUBLAS_STATUS_SUCCESS) {
fprintf(stderr,
"!!!! kernel execution error. (m: %d, n: %d, k: %d, error: %d) \n",
"!!!! kernel execution error. (batch: %d, m: %d, n: %d, k: %d, error: %d) \n",
batch,
m,
n,
k,
Expand Down
Loading