Skip to content

Commit

Permalink
Fix multi GPU on multiple amd architectures with rocblas_initialize() (
Browse files Browse the repository at this point in the history
…ggerganov#5)

* initialize rocblas
  • Loading branch information
YellowRoseCx authored Jul 24, 2023
1 parent 3db70b5 commit 1f6294d
Showing 1 changed file with 5 additions and 0 deletions.
5 changes: 5 additions & 0 deletions ggml-cuda.cu
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@
#include <hip/hip_runtime.h>
#include <hipblas/hipblas.h>
#include <hip/hip_fp16.h>
#include "rocblas/rocblas.h"
#define CUBLAS_COMPUTE_32F HIPBLAS_R_32F
#define CUBLAS_COMPUTE_32F_FAST_16F HIPBLAS_R_32F
#define CUBLAS_GEMM_DEFAULT HIPBLAS_GEMM_DEFAULT
Expand Down Expand Up @@ -2531,6 +2532,10 @@ void ggml_init_cublas() {
static bool initialized = false;

if (!initialized) {
#ifdef GGML_USE_HIPBLAS
rocblas_initialize();
hipDeviceSynchronize();
#endif
CUDA_CHECK(cudaGetDeviceCount(&g_device_count));
GGML_ASSERT(g_device_count <= GGML_CUDA_MAX_DEVICES);
int64_t total_vram = 0;
Expand Down

0 comments on commit 1f6294d

Please sign in to comment.