Fixed WSL cuda's OOM error (#1594)

* In the function `ggml_cuda_host_malloc`, add the CUDA error bypass. * Remove excess code and prints. --------- Co-authored-by: liang <liangmanlai@126.com>
2024-12-26 14:20:31 +01:00 · 2023-06-11 21:20:52 +08:00 · 2023-06-11 21:20:52 +08:00 · 12b063f0ec
commit 12b063f0ec
parent 31d2b5f4a4
1 changed files with 3 additions and 0 deletions
--- a/ggml-cuda.cu
+++ b/ggml-cuda.cu
@@ -1105,6 +1105,9 @@ void * ggml_cuda_host_malloc(size_t size) {
    void * ptr = nullptr;
    cudaError_t err = cudaMallocHost((void **) &ptr, size);
    if (err != cudaSuccess) {
        // The allocation error can be bypassed. A null pointer will be returned from this function.
        // This fixes the OOM error in WSL.
        cudaGetLastError();
        fprintf(stderr, "WARNING: failed to allocate %.2f MB of pinned memory: %s\n",
            size/1024.0/1024.0, cudaGetErrorString(err));
        return nullptr;