Materialize a non-default device for C2 legacy storage. (#18605)
authorGregory Chanan <gchanan@fb.com>
Thu, 11 Apr 2019 20:22:49 +0000 (13:22 -0700)
committerFacebook Github Bot <facebook-github-bot@users.noreply.github.com>
Thu, 11 Apr 2019 20:50:41 +0000 (13:50 -0700)
Summary:
It's not intended that Storages have 'default' CUDA devices, but this is allowable via the Storage::create_legacy codepath.

This also messes with device_caching, because the initial cache is obtained from the Storage, which may have a 'default' device.

Instead, we materialize a device by allocating 0 bytes via the allocator.
Pull Request resolved: https://github.com/pytorch/pytorch/pull/18605

Differential Revision: D14680620

Pulled By: gchanan

fbshipit-source-id: 6d43383d836e90beaf12bfe37c3f0506843f5432

c10/core/Storage.h
caffe2/core/context_gpu.cu

index 82d8b31..6d86119 100644 (file)
@@ -41,11 +41,12 @@ struct C10_API Storage {
   // that can be temporarily created with Caffe2 APIs. See the note on top of
   // TensorImpl.h for details.
   static Storage create_legacy(at::Device device, caffe2::TypeMeta data_type) {
+    auto allocator = GetAllocator(device.type());
     return Storage(c10::make_intrusive<StorageImpl>(
             data_type,
             0,
-            at::DataPtr(nullptr, device),
-            GetAllocator(device.type()),
+            allocator->allocate(0), // materialize a non-default Device.
+            allocator,
             true));
   }
 
index d7f7fc6..0bd259e 100644 (file)
@@ -485,14 +485,18 @@ struct DefaultCUDAAllocator final : public at::Allocator {
     }
     switch (g_cuda_memory_pool_type) {
       case CudaMemoryPoolType::NONE:
-        CUDA_ENFORCE(cudaMalloc(&ptr, nbytes));
+        if (nbytes != 0) {
+          CUDA_ENFORCE(cudaMalloc(&ptr, nbytes));
+        }
         if (FLAGS_caffe2_gpu_memory_tracking) {
           g_size_map[ptr] = nbytes;
           g_cuda_device_affiliation[ptr] = CaffeCudaGetDevice();
         }
         return {ptr, ptr, &Delete, at::Device(CUDA, CaffeCudaGetDevice())};
       case CudaMemoryPoolType::CUB:
-        CUDA_ENFORCE(g_cub_allocator->DeviceAllocate(&ptr, nbytes));
+        if (nbytes != 0) {
+          CUDA_ENFORCE(g_cub_allocator->DeviceAllocate(&ptr, nbytes));
+        }
         g_cuda_device_affiliation[ptr] = CaffeCudaGetDevice();
         VLOG(2) << "CUB allocating pointer " << ptr << " on device "
                 << CaffeCudaGetDevice();