Better memory management in DTensor<T>::allocateOnDevice

alphaville · alphaville · commit 4198ecf55899 · 2024-11-07T23:16:23.000Z
Free already-allocated device memory if a subsequent allocation fails
Fix code formatting in testTensor
Change the return type of allocateOnDevice from bool to void
diff --git a/include/tensor.cuh b/include/tensor.cuh
@@ -202,9 +202,8 @@ private:
      * Allocate `size` number of `T` data on the device.
      * @param size number of data elements to allocate
      * @param zero sets allocated data to `0`
-     * @return
      */
-    bool allocateOnDevice(size_t size, bool zero = false);
+    void allocateOnDevice(size_t size, bool zero = false);
 
     /**
      * Create column-major `std::vector` from a row-major one.
@@ -837,23 +836,24 @@ void DTensor<T>::applyLeftGivensRotation(size_t i, size_t j, const T *c, const T
 }
 
 template<typename T>
-inline bool DTensor<T>::allocateOnDevice(size_t size, bool zero) {
-    if (size <= 0) return false;
+inline void DTensor<T>::allocateOnDevice(size_t size, bool zero) {
+    cudaError_t cudaStatus;
+    if (size <= 0) return;
     destroy();
     m_doDestroyData = true;
     size_t buffer_size = size * sizeof(T);
-    bool cudaStatus = cudaMalloc(&m_d_data, buffer_size);
-    if (cudaStatus != cudaSuccess) return false;
+    gpuErrChk(cudaMalloc(&m_d_data, buffer_size));
     if (zero) gpuErrChk(cudaMemset(m_d_data, 0, buffer_size)); // set to zero all elements
 
     if (numMats() > 1) {
         m_doDestroyPtrMatrices = true;
         cudaStatus = cudaMalloc(&m_d_ptrMatrices, numMats() * sizeof(T *));
+        if (cudaStatus != cudaSuccess) {
+            gpuErrChk(cudaFree(m_d_data));
+        }
     } else {
         m_doDestroyPtrMatrices = false;
     }
-
-    return (cudaStatus != cudaSuccess);
 }
 
 template<typename T>
diff --git a/test/testTensor.cu b/test/testTensor.cu
@@ -123,7 +123,7 @@ TEMPLATE_WITH_TYPE_T
 void tensorMoveConstructor() {
     DTensor<T> zero(2, 3, 4, true);
     DTensor<T> x(std::move(zero));
-    DTensor<T> y(DTensor < T > {100, 10, 1000});
+    DTensor<T> y(DTensor<T> {100, 10, 1000});
 }
 
 TEST_F(TensorTest, tensorMoveConstructor) {

Original file line number	Diff line number	Diff line change
`@@ -123,7 +123,7 @@ TEMPLATE_WITH_TYPE_T`
`123`	`123`	`void tensorMoveConstructor() {`
`124`	`124`	`DTensor<T> zero(2, 3, 4, true);`
`125`	`125`	`DTensor<T> x(std::move(zero));`
`126`		`- DTensor<T> y(DTensor < T > {100, 10, 1000});`
	`126`	`+ DTensor<T> y(DTensor<T> {100, 10, 1000});`
`127`	`127`	`}`
`128`	`128`
`129`	`129`	`TEST_F(TensorTest, tensorMoveConstructor) {`