ggerganov committed on
Commit
46033e6
·
unverified ·
1 Parent(s): 7006035

cuda : fix HIPBLAS build

Browse files
Files changed (2) hide show
  1. extra/sync-ggml.sh +1 -1
  2. ggml-cuda.cu +6 -0
extra/sync-ggml.sh CHANGED
@@ -1,12 +1,12 @@
1
  #!/bin/bash
2
 
3
  cp -rpv ../ggml/src/ggml.c ./ggml.c
 
4
  cp -rpv ../ggml/src/ggml-alloc.c ./ggml-alloc.c
5
  cp -rpv ../ggml/src/ggml-backend-impl.h ./ggml-backend-impl.h
6
  cp -rpv ../ggml/src/ggml-backend.c ./ggml-backend.c
7
  cp -rpv ../ggml/src/ggml-cuda.cu ./ggml-cuda.cu
8
  cp -rpv ../ggml/src/ggml-cuda.h ./ggml-cuda.h
9
- cp -rpv ../ggml/src/ggml-impl.h ./ggml-impl.h
10
  cp -rpv ../ggml/src/ggml-metal.h ./ggml-metal.h
11
  cp -rpv ../ggml/src/ggml-metal.m ./ggml-metal.m
12
  cp -rpv ../ggml/src/ggml-metal.metal ./ggml-metal.metal
 
1
  #!/bin/bash
2
 
3
  cp -rpv ../ggml/src/ggml.c ./ggml.c
4
+ cp -rpv ../ggml/src/ggml-impl.h ./ggml-impl.h
5
  cp -rpv ../ggml/src/ggml-alloc.c ./ggml-alloc.c
6
  cp -rpv ../ggml/src/ggml-backend-impl.h ./ggml-backend-impl.h
7
  cp -rpv ../ggml/src/ggml-backend.c ./ggml-backend.c
8
  cp -rpv ../ggml/src/ggml-cuda.cu ./ggml-cuda.cu
9
  cp -rpv ../ggml/src/ggml-cuda.h ./ggml-cuda.h
 
10
  cp -rpv ../ggml/src/ggml-metal.h ./ggml-metal.h
11
  cp -rpv ../ggml/src/ggml-metal.m ./ggml-metal.m
12
  cp -rpv ../ggml/src/ggml-metal.metal ./ggml-metal.metal
ggml-cuda.cu CHANGED
@@ -39,6 +39,7 @@
39
  #define cudaDeviceCanAccessPeer hipDeviceCanAccessPeer
40
  #define cudaDeviceDisablePeerAccess hipDeviceDisablePeerAccess
41
  #define cudaDeviceEnablePeerAccess hipDeviceEnablePeerAccess
 
42
  #define cudaDeviceProp hipDeviceProp_t
43
  #define cudaDeviceSynchronize hipDeviceSynchronize
44
  #define cudaError_t hipError_t
@@ -48,6 +49,7 @@
48
  #define cudaEvent_t hipEvent_t
49
  #define cudaEventDestroy hipEventDestroy
50
  #define cudaFree hipFree
 
51
  #define cudaFreeHost hipHostFree
52
  #define cudaGetDevice hipGetDevice
53
  #define cudaGetDeviceCount hipGetDeviceCount
@@ -55,6 +57,7 @@
55
  #define cudaGetErrorString hipGetErrorString
56
  #define cudaGetLastError hipGetLastError
57
  #define cudaMalloc hipMalloc
 
58
  #define cudaMallocHost(ptr, size) hipHostMalloc(ptr, size, hipHostMallocDefault)
59
  #define cudaMemcpy hipMemcpy
60
  #define cudaMemcpy2DAsync hipMemcpy2DAsync
@@ -63,6 +66,9 @@
63
  #define cudaMemcpyDeviceToHost hipMemcpyDeviceToHost
64
  #define cudaMemcpyHostToDevice hipMemcpyHostToDevice
65
  #define cudaMemcpyKind hipMemcpyKind
 
 
 
66
  #define cudaMemset hipMemset
67
  #define cudaMemsetAsync hipMemsetAsync
68
  #define cudaOccupancyMaxPotentialBlockSize hipOccupancyMaxPotentialBlockSize
 
39
  #define cudaDeviceCanAccessPeer hipDeviceCanAccessPeer
40
  #define cudaDeviceDisablePeerAccess hipDeviceDisablePeerAccess
41
  #define cudaDeviceEnablePeerAccess hipDeviceEnablePeerAccess
42
+ #define cudaDeviceGetMemPool hipDeviceGetMemPool
43
  #define cudaDeviceProp hipDeviceProp_t
44
  #define cudaDeviceSynchronize hipDeviceSynchronize
45
  #define cudaError_t hipError_t
 
49
  #define cudaEvent_t hipEvent_t
50
  #define cudaEventDestroy hipEventDestroy
51
  #define cudaFree hipFree
52
+ #define cudaFreeAsync hipFreeAsync
53
  #define cudaFreeHost hipHostFree
54
  #define cudaGetDevice hipGetDevice
55
  #define cudaGetDeviceCount hipGetDeviceCount
 
57
  #define cudaGetErrorString hipGetErrorString
58
  #define cudaGetLastError hipGetLastError
59
  #define cudaMalloc hipMalloc
60
+ #define cudaMallocFromPoolAsync hipMallocFromPoolAsync
61
  #define cudaMallocHost(ptr, size) hipHostMalloc(ptr, size, hipHostMallocDefault)
62
  #define cudaMemcpy hipMemcpy
63
  #define cudaMemcpy2DAsync hipMemcpy2DAsync
 
66
  #define cudaMemcpyDeviceToHost hipMemcpyDeviceToHost
67
  #define cudaMemcpyHostToDevice hipMemcpyHostToDevice
68
  #define cudaMemcpyKind hipMemcpyKind
69
+ #define cudaMemPool_t hipMemPool_t
70
+ #define cudaMemPoolAttrReleaseThreshold hipMemPoolAttrReleaseThreshold
71
+ #define cudaMemPoolSetAttribute hipMemPoolSetAttribute
72
  #define cudaMemset hipMemset
73
  #define cudaMemsetAsync hipMemsetAsync
74
  #define cudaOccupancyMaxPotentialBlockSize hipOccupancyMaxPotentialBlockSize