gogogo2015
diff --git a/‎caffe2/contrib/nccl/cuda_nccl_op_gpu.cc
+2-2 b/‎caffe2/contrib/nccl/cuda_nccl_op_gpu.cc
+2-2
diff --git a/‎caffe2/contrib/nccl/nccl_ops_test.py
+1-1 b/‎caffe2/contrib/nccl/nccl_ops_test.py
+1-1
diff --git a/‎caffe2/contrib/prof/prof_dag_net.cc
+2-2 b/‎caffe2/contrib/prof/prof_dag_net.cc
+2-2
diff --git a/‎caffe2/contrib/tensorboard/tensorboard_exporter.py
+1-1 b/‎caffe2/contrib/tensorboard/tensorboard_exporter.py
+1-1
diff --git a/‎caffe2/contrib/warpctc/ctc_ops_test.py
+4-4 b/‎caffe2/contrib/warpctc/ctc_ops_test.py
+4-4
diff --git a/‎caffe2/core/blob_gpu_test.cc
+2-2 b/‎caffe2/core/blob_gpu_test.cc
+2-2
diff --git a/‎caffe2/core/context_gpu.cu
+1-1 b/‎caffe2/core/context_gpu.cu
+1-1
diff --git a/‎caffe2/core/context_gpu.h
+3-3 b/‎caffe2/core/context_gpu.h
+3-3
diff --git a/‎caffe2/core/cudnn_wrappers.h
+3-3 b/‎caffe2/core/cudnn_wrappers.h
+3-3
diff --git a/‎caffe2/core/event_gpu.cc
+8-8 b/‎caffe2/core/event_gpu.cc
+8-8
diff --git a/‎caffe2/core/hip/event_hip.cc
+1-1 b/‎caffe2/core/hip/event_hip.cc
+1-1
diff --git a/‎caffe2/core/memonger.cc
+2-2 b/‎caffe2/core/memonger.cc
+2-2
diff --git a/‎caffe2/core/net_async_base.cc
+2-2 b/‎caffe2/core/net_async_base.cc
+2-2
diff --git a/‎caffe2/core/net_async_dag_gpu.cc
+1-1 b/‎caffe2/core/net_async_dag_gpu.cc
+1-1
diff --git a/‎caffe2/core/net_gpu_test.cc
+1-1 b/‎caffe2/core/net_gpu_test.cc
+1-1
diff --git a/‎caffe2/core/operator.cc
+1-1 b/‎caffe2/core/operator.cc
+1-1
diff --git a/‎caffe2/mkl/utils/mkl_memory.cc
+1-1 b/‎caffe2/mkl/utils/mkl_memory.cc
+1-1
diff --git a/‎caffe2/observers/profile_observer_gpu.cc
+2-2 b/‎caffe2/observers/profile_observer_gpu.cc
+2-2
diff --git a/‎caffe2/onnx/backend.cc
+1-1 b/‎caffe2/onnx/backend.cc
+1-1
diff --git a/‎caffe2/operators/load_save_op_gpu.cc
+1-1 b/‎caffe2/operators/load_save_op_gpu.cc
+1-1
diff --git a/‎caffe2/operators/rnn/recurrent_network_executor_gpu.cc
+2-2 b/‎caffe2/operators/rnn/recurrent_network_executor_gpu.cc
+2-2
diff --git a/‎caffe2/proto/caffe2.proto
+1-1 b/‎caffe2/proto/caffe2.proto
+1-1
@@ -11,7 +11,7 @@ nccl::NCCLExecution getNCCLElements(
   // We either do an N-N op, or an N-1 op.
   CAFFE_ENFORCE(op->InputSize() == op->OutputSize() || op->OutputSize() == 1);
   nccl::NCCLExecution ex;
-  ex.stream_gpu_id = context.device_id();
+  ex.stream_gpu_id = context.cuda_gpu_id();
   ex.stream = context.cuda_stream();
   ex.root = op->template GetSingleArgument<int>("root", 0);
   ex.elements.resize(op->InputSize());
@@ -204,7 +204,7 @@ std::pair<std::vector<DeviceOption>, std::vector<DeviceOption>> ncclOpDevInfer(
   for (int i = 0; i < def.input().size(); ++i) {
     DeviceOption dev;
     dev.set_device_type(1);
-    dev.set_device_id(i);
+    dev.set_cuda_gpu_id(i);
     opt.push_back(dev);
   }
   return std::make_pair(opt, opt);
 
@@ -21,7 +21,7 @@
 def gpu_device(i):
     device_option = caffe2_pb2.DeviceOption()
     device_option.device_type = caffe2_pb2.CUDA
-    device_option.device_id = i
+    device_option.cuda_gpu_id = i
     return device_option
 
 
 
@@ -33,9 +33,9 @@ void ProfDAGNet::ValidateOpTensorDevices() {
       had_mismatches = true;
       LOG(INFO) << "== PERFORMANCE WARNING == \n"
                 << " Operator " << node.operator_->debug_def().type()
-                << " expects GPU " << mismatch.second.first.device_id()
+                << " expects GPU " << mismatch.second.first.cuda_gpu_id()
                 << " but tensor [" << mismatch.first << "] is on GPU "
-                << mismatch.second.second.device_id();
+                << mismatch.second.second.cuda_gpu_id();
     }
   }
   if (!had_mismatches) {
 
@@ -177,7 +177,7 @@ def _tf_device(device_option):
     if device_option.device_type == caffe2_pb2.CPU:
         return "/cpu:*"
     if device_option.device_type == caffe2_pb2.CUDA:
-        return "/gpu:{}".format(device_option.device_id)
+        return "/gpu:{}".format(device_option.cuda_gpu_id)
     raise Exception("Unhandled device", device_option)
 
 
 
@@ -79,11 +79,11 @@ def test_ctc_cost_cpu(self):
     def test_ctc_cost_gpu(self):
         self.verify_cost(
             caffe2_pb2.DeviceOption(device_type=caffe2_pb2.CUDA,
-                                    device_id=0),
+                                    cuda_gpu_id=0),
             is_test=False)
         self.verify_cost(
             caffe2_pb2.DeviceOption(device_type=caffe2_pb2.CUDA,
-                                    device_id=0),
+                                    cuda_gpu_id=0),
             is_test=False,
             skip_input_lengths=True)
 
@@ -99,10 +99,10 @@ def test_ctc_forward_only_cpu(self):
     def test_ctc_forward_only_gpu(self):
         self.verify_cost(
             caffe2_pb2.DeviceOption(device_type=caffe2_pb2.CUDA,
-                                    device_id=0),
+                                    cuda_gpu_id=0),
             is_test=True)
         self.verify_cost(
             caffe2_pb2.DeviceOption(device_type=caffe2_pb2.CUDA,
-                                    device_id=0),
+                                    cuda_gpu_id=0),
             is_test=True,
             skip_input_lengths=True)
@@ -195,7 +195,7 @@ TEST(TensorTest, TensorSerializationMultiDevices) {
     }
     EXPECT_TRUE(tensor_proto.has_device_detail());
     EXPECT_EQ(tensor_proto.device_detail().device_type(), PROTO_CUDA);
-    EXPECT_EQ(tensor_proto.device_detail().device_id(), gpu_id);
+    EXPECT_EQ(tensor_proto.device_detail().cuda_gpu_id(), gpu_id);
     // Test if the restored blob is still of the same device.
     blob.Reset();
     EXPECT_NO_THROW(DeserializeBlob(serialized, &blob));
@@ -205,7 +205,7 @@ TEST(TensorTest, TensorSerializationMultiDevices) {
     // Test if we force the restored blob on a different device, we
     // can still get so.
     blob.Reset();
-    proto.mutable_tensor()->mutable_device_detail()->set_device_id(0);
+    proto.mutable_tensor()->mutable_device_detail()->set_cuda_gpu_id(0);
     EXPECT_NO_THROW(DeserializeBlob(proto.SerializeAsString(), &blob));
     EXPECT_TRUE(BlobIsTensorType(blob, CUDA));
     EXPECT_EQ(GetGPUIDForPointer(blob.Get<TensorCUDA>().data<float>()), 0);
 
@@ -256,7 +256,7 @@ CUDAContext::CUDAContext(const int gpu_id)
 
 CUDAContext::CUDAContext(const DeviceOption& option)
     : gpu_id_(
-          option.has_device_id() ? RectifyGPUID(option.device_id())
+          option.has_cuda_gpu_id() ? RectifyGPUID(option.cuda_gpu_id())
                                    : CaffeCudaGetDevice()),
       random_seed_(
           option.has_random_seed() ? option.random_seed()
 
@@ -184,7 +184,7 @@ class CAFFE2_CUDA_API CUDAContext final : public BaseContext {
     }
   }
 
-  inline int device_id() const {
+  inline int cuda_gpu_id() const {
     return gpu_id_;
   }
 
@@ -283,7 +283,7 @@ class CAFFE2_CUDA_API CUDAContext final : public BaseContext {
   }
 
   static bool IsStreamFree(const DeviceOption& option, int stream_id) {
-    auto stream = CUDAContext::cuda_stream(option.device_id(), stream_id);
+    auto stream = CUDAContext::cuda_stream(option.cuda_gpu_id(), stream_id);
     return cudaStreamQuery(stream) == cudaSuccess;
   }
 
@@ -393,7 +393,7 @@ class CAFFE2_CUDA_API CUDAStaticContext final : public BaseStaticContext {
 
   void ExtractDeviceOption(DeviceOption* device, const void* data) override {
     device->set_device_type(TypeToProto(GetDeviceType()));
-    device->set_device_id(GetGPUIDForPointer(data));
+    device->set_cuda_gpu_id(GetGPUIDForPointer(data));
   }
 
  protected:
 
@@ -122,17 +122,17 @@ class CuDNNWrapper {
   void with_cudnn_state(size_t state_idx, F&& f) {
     CAFFE_ENFORCE(
         state_idx < CAFFE2_COMPILE_TIME_MAX_CUDNN_STATES, "Invalid state_idx");
-    auto& sync_state = cudnn_states()[context_->device_id()][state_idx];
+    auto& sync_state = cudnn_states()[context_->cuda_gpu_id()][state_idx];
 
-    DeviceGuard dg(context_->device_id());
+    DeviceGuard dg(context_->cuda_gpu_id());
 
     // We need to serialize execution on the CuDNNState as we can't
     // allow multiple threads to race through the cudaEventRecord
     // calls (so a worker thread might wait on another worker thread's
     // execution)
     std::lock_guard<std::mutex> g(sync_state.mutex);
     if (!sync_state.state.get()) {
-      sync_state.state.reset(new CuDNNState(context_->device_id()));
+      sync_state.state.reset(new CuDNNState(context_->cuda_gpu_id()));
     }
     CHECK_NOTNULL(sync_state.state.get())->execute(context_->cuda_stream(), f);
   }
 
@@ -9,21 +9,21 @@ namespace caffe2 {
 struct CudaEventWrapper {
   explicit CudaEventWrapper(const DeviceOption& option)
       : cuda_stream_(nullptr),
-        device_id_(option.device_id()),
+        cuda_gpu_id_(option.cuda_gpu_id()),
         status_(EventStatus::EVENT_INITIALIZED) {
     CAFFE_ENFORCE(option.device_type(), PROTO_CUDA);
-    DeviceGuard g(device_id_);
+    DeviceGuard g(cuda_gpu_id_);
     CUDA_ENFORCE(cudaEventCreate(
         &cuda_event_, cudaEventDefault | cudaEventDisableTiming));
   }
   ~CudaEventWrapper() {
-    DeviceGuard g(device_id_);
+    DeviceGuard g(cuda_gpu_id_);
     CUDA_CHECK(cudaEventDestroy(cuda_event_));
   }
 
   cudaEvent_t cuda_event_;
   cudaStream_t cuda_stream_;
-  int device_id_;
+  int cuda_gpu_id_;
 
   std::atomic<int> status_;
   std::mutex mutex_recorded_;
@@ -65,12 +65,12 @@ void EventRecordCUDA(Event* event, const void* context, const char* err_msg) {
       const auto& current_device = CaffeCudaGetDevice();
       CAFFE_ENFORCE_EQ(
           current_device,
-          wrapper->device_id_,
+          wrapper->cuda_gpu_id_,
           "When you call EventRecordCUDA, your current device should be the same "
           "as the device specified by the event.");
       CAFFE_ENFORCE_EQ(
           current_device,
-          static_cast<const CUDAContext*>(context)->device_id());
+          static_cast<const CUDAContext*>(context)->cuda_gpu_id());
       CUDA_ENFORCE(cudaEventRecord(
           wrapper->cuda_event_,
           static_cast<const CUDAContext*>(context)->cuda_stream()));
@@ -96,7 +96,7 @@ void EventFinishCUDA(const Event* event) {
 
   if (wrapper->status_ == EventStatus::EVENT_SCHEDULED) {
     // ok, even if event is already completed and status was not yet updated
-    DeviceGuard g(wrapper->device_id_);
+    DeviceGuard g(wrapper->cuda_gpu_id_);
     auto cudaResult = cudaEventSynchronize(wrapper->cuda_event_);
     if (cudaResult == cudaSuccess) {
       wrapper->status_ = EventStatus::EVENT_SUCCESS;
@@ -127,7 +127,7 @@ void EventWaitCUDACUDA(const Event* event, void* context) {
     if (context_stream != event_stream) {
       // CAFFE_ENFORCE_EQ(
       //    CaffeCudaGetDevice(),
-      //    static_cast<const CUDAContext*>(context)->device_id());
+      //    static_cast<const CUDAContext*>(context)->cuda_gpu_id());
       CUDA_CHECK(cudaStreamWaitEvent(context_stream, wrapper->cuda_event_, 0));
     }
   }
 
@@ -138,7 +138,7 @@ void EventWaitHIPHIP(const Event* event, void* context)
         {
             // CAFFE_ENFORCE_EQ(
             //    CaffeCudaGetDevice(),
-            //    static_cast<const CUDAContext*>(context)->device_id());
+            //    static_cast<const CUDAContext*>(context)->cuda_gpu_id());
             HIP_CHECK(hipStreamWaitEvent(context_stream, wrapper->hip_event_, 0));
         }
     }
 
@@ -176,7 +176,7 @@ class ComputeBlobRecyclingForDag {
         // cuda device option but whose inputs/outputs are on CPU
         if (net.op(op_index).type() == "CopyGPUToCPU") {
           blob_device_[output].set_device_type(0);
-          blob_device_[output].set_device_id(0);
+          blob_device_[output].set_cuda_gpu_id(0);
         }
       }
     }
@@ -478,7 +478,7 @@ class ComputeBlobRecyclingForDag {
       const DeviceOption& device_option) {
     const DeviceOption& blob_device = blob_device_[blob_name];
     if (device_option.device_type() != blob_device.device_type() ||
-        device_option.device_id() != blob_device.device_id()) {
+        device_option.cuda_gpu_id() != blob_device.cuda_gpu_id()) {
       return false;
     }
     for (const int token : req_tokens_[blob_name]) {
 
@@ -157,7 +157,7 @@ TaskThreadPool* AsyncNetBase::pool(const DeviceOption& device_option) {
         numa_node_id);
     return poolGetter(cpu_pools_, PROTO_CPU, numa_node_id, num_workers_);
   } else if (device_option.device_type() == PROTO_CUDA) {
-    auto gpu_id = device_option.device_id();
+    auto gpu_id = device_option.cuda_gpu_id();
     CAFFE_ENFORCE(
         gpu_id >= 0 && gpu_id < FLAGS_caffe2_net_async_max_gpus,
         "Invalid GPU id: " + caffe2::to_string(gpu_id));
@@ -173,7 +173,7 @@ int AsyncNetBase::stream(int task_id) {
   const auto& device_option = event(task_id).GetDeviceOption();
   int stream_id = 0;
   if (device_option.device_type() == PROTO_CUDA) {
-    int gpu_id = device_option.device_id();
+    int gpu_id = device_option.cuda_gpu_id();
     CAFFE_ENFORCE_GE(gpu_id, 0, "Invalid gpu id: " + caffe2::to_string(gpu_id));
     if ((unsigned)gpu_id >= getStreamCounters().size()) {
       getStreamCounters().resize(gpu_id + 1, 0);
 
@@ -112,7 +112,7 @@ AsyncDAGNet::AsyncDAGNet(
 int AsyncDAGNet::stream(const DeviceOption& device_option) {
   int stream_id = 0;
   if (device_option.device_type() == PROTO_CUDA) {
-    int gpu_id = device_option.device_id();
+    int gpu_id = device_option.cuda_gpu_id();
     CAFFE_ENFORCE_GE(gpu_id, 0, "Invalid gpu id: " + caffe2::to_string(gpu_id));
     if ((unsigned)gpu_id >= stream_counters_.size()) {
       stream_counters_.resize(gpu_id + 1, 0);
 
@@ -124,7 +124,7 @@ TEST(NetTest, DISABLED_ChainingForDifferentDevices) {
           type: "NetTestDummy"
           device_option {
             device_type: 1
-            device_id: 1
+            cuda_gpu_id: 1
           }
         }
 )DOC";
 
@@ -649,7 +649,7 @@ std::map<string, std::pair<DeviceOption, DeviceOption>> ValidateTensorDevices(
           &blob_device);
 
       if (blob_device.device_type() == PROTO_CUDA &&
-          blob_device.device_id() != op_device.device_id()) {
+          blob_device.cuda_gpu_id() != op_device.cuda_gpu_id()) {
         mismatches[blob_name] = std::make_pair(op_device, blob_device);
       } else if (
           blob_device.device_type() == PROTO_HIP &&
 
@@ -26,7 +26,7 @@ static vector<int64_t> GetMKLTensorInfo(
   const mkl::MKLMemory<T>* tc = static_cast<const mkl::MKLMemory<T>*>(c);
   *capacity = tc->size() * sizeof(T);
   device->set_device_type(PROTO_MKLDNN);
-  device->set_device_id(0);
+  device->set_cuda_gpu_id(0);
   return tc->dims();
 }
 
 
@@ -70,7 +70,7 @@ void ProfileOperatorObserver::Start() {
     int device;
     cudaGetDevice(&device);
 
-    cudaSetDevice(context->device_id());
+    cudaSetDevice(context->cuda_gpu_id());
     cudaEventCreate(&start_);
     cudaEventRecord(start_, context->cuda_stream());
 
@@ -92,7 +92,7 @@ void ProfileOperatorObserver::Stop() {
     int device;
     cudaGetDevice(&device);
 
-    cudaSetDevice(context->device_id());
+    cudaSetDevice(context->cuda_gpu_id());
     cudaEventCreate(&stop_);
     cudaEventRecord(stop_, context->cuda_stream());
     cudaEventSynchronize(stop_);
 
@@ -65,7 +65,7 @@ caffe2::DeviceOption GetDeviceOption(const Device& onnx_device) {
       {DeviceType::CUDA, caffe2::DeviceType::CUDA}};
   caffe2::DeviceOption d;
   d.set_device_type(static_cast<int32_t>(m.at(onnx_device.type)));
-  d.set_device_id(onnx_device.device_id);
+  d.set_cuda_gpu_id(onnx_device.device_id);
   return d;
 }
 
 
@@ -9,7 +9,7 @@ void LoadOp<CUDAContext>::SetCurrentDevice(BlobProto* proto) {
     proto->mutable_tensor()->clear_device_detail();
     auto* device_detail = proto->mutable_tensor()->mutable_device_detail();
     device_detail->set_device_type(PROTO_CUDA);
-    device_detail->set_device_id(CaffeCudaGetDevice());
+    device_detail->set_cuda_gpu_id(CaffeCudaGetDevice());
   }
 }
 
 
@@ -72,11 +72,11 @@ void CUDARecurrentNetworkExecutor::_ExecRange(int from, int to) {
       if (gpu_id == -1 &&
           rnn_op.op->device_option().device_type() ==
               DeviceTypeProto::PROTO_CUDA) {
-        gpu_id = rnn_op.op->device_option().device_id();
+        gpu_id = rnn_op.op->device_option().cuda_gpu_id();
       } else {
         CAFFE_ENFORCE(
             rnn_op.op->device_option().device_type() == 0 ||
-                rnn_op.op->device_option().device_id() == gpu_id,
+                rnn_op.op->device_option().cuda_gpu_id() == gpu_id,
             "RNN Executor only supports ops on one GPU");
       }
 
 
@@ -183,7 +183,7 @@ message DeviceOption {
   // optional DeviceType device_type = 1 [ default = CPU ];
   optional int32 device_type = 1 [ default = 0 ]; // 0 is CPU.
   // [CUDA specific] the cuda gpu id.
-  optional int32 device_id = 2;
+  optional int32 cuda_gpu_id = 2;
   // [general] The random seed to start the device random number generator with.
   optional uint32 random_seed = 3;
   // [general] What node this op should execute on.
Original file line number	Diff line number	Diff line change
`@@ -33,9 +33,9 @@ void ProfDAGNet::ValidateOpTensorDevices() {`
`33`	`33`	`had_mismatches = true;`
`34`	`34`	`LOG(INFO) << "== PERFORMANCE WARNING == \n"`
`35`	`35`	`<< " Operator " << node.operator_->debug_def().type()`
`36`		`- << " expects GPU " << mismatch.second.first.device_id()`
	`36`	`+ << " expects GPU " << mismatch.second.first.cuda_gpu_id()`
`37`	`37`	`<< " but tensor [" << mismatch.first << "] is on GPU "`
`38`		`- << mismatch.second.second.device_id();`
	`38`	`+ << mismatch.second.second.cuda_gpu_id();`
`39`	`39`	`}`
`40`	`40`	`}`
`41`	`41`	`if (!had_mismatches) {`
Original file line number	Diff line number	Diff line change
`@@ -184,7 +184,7 @@ class CAFFE2_CUDA_API CUDAContext final : public BaseContext {`
`184`	`184`	`}`
`185`	`185`	`}`
`186`	`186`
`187`		`- inline int device_id() const {`
	`187`	`+ inline int cuda_gpu_id() const {`
`188`	`188`	`return gpu_id_;`
`189`	`189`	`}`
`190`	`190`
`@@ -283,7 +283,7 @@ class CAFFE2_CUDA_API CUDAContext final : public BaseContext {`
`283`	`283`	`}`
`284`	`284`
`285`	`285`	`static bool IsStreamFree(const DeviceOption& option, int stream_id) {`
`286`		`- auto stream = CUDAContext::cuda_stream(option.device_id(), stream_id);`
	`286`	`+ auto stream = CUDAContext::cuda_stream(option.cuda_gpu_id(), stream_id);`
`287`	`287`	`return cudaStreamQuery(stream) == cudaSuccess;`
`288`	`288`	`}`
`289`	`289`
`@@ -393,7 +393,7 @@ class CAFFE2_CUDA_API CUDAStaticContext final : public BaseStaticContext {`
`393`	`393`
`394`	`394`	`void ExtractDeviceOption(DeviceOption* device, const void* data) override {`
`395`	`395`	`device->set_device_type(TypeToProto(GetDeviceType()));`
`396`		`- device->set_device_id(GetGPUIDForPointer(data));`
	`396`	`+ device->set_cuda_gpu_id(GetGPUIDForPointer(data));`
`397`	`397`	`}`
`398`	`398`
`399`	`399`	`protected:`
Original file line number	Diff line number	Diff line change
`@@ -138,7 +138,7 @@ void EventWaitHIPHIP(const Event* event, void* context)`
`138`	`138`	`{`
`139`	`139`	`// CAFFE_ENFORCE_EQ(`
`140`	`140`	`// CaffeCudaGetDevice(),`
`141`		`- // static_cast<const CUDAContext*>(context)->device_id());`
	`141`	`+ // static_cast<const CUDAContext*>(context)->cuda_gpu_id());`
`142`	`142`	`HIP_CHECK(hipStreamWaitEvent(context_stream, wrapper->hip_event_, 0));`
`143`	`143`	`}`
`144`	`144`	`}`
Original file line number	Diff line number	Diff line change
`@@ -176,7 +176,7 @@ class ComputeBlobRecyclingForDag {`
`176`	`176`	`// cuda device option but whose inputs/outputs are on CPU`
`177`	`177`	`if (net.op(op_index).type() == "CopyGPUToCPU") {`
`178`	`178`	`blob_device_[output].set_device_type(0);`
`179`		`- blob_device_[output].set_device_id(0);`
	`179`	`+ blob_device_[output].set_cuda_gpu_id(0);`
`180`	`180`	`}`
`181`	`181`	`}`
`182`	`182`	`}`
`@@ -478,7 +478,7 @@ class ComputeBlobRecyclingForDag {`
`478`	`478`	`const DeviceOption& device_option) {`
`479`	`479`	`const DeviceOption& blob_device = blob_device_[blob_name];`
`480`	`480`	`if (device_option.device_type() != blob_device.device_type() \|\|`
`481`		`- device_option.device_id() != blob_device.device_id()) {`
	`481`	`+ device_option.cuda_gpu_id() != blob_device.cuda_gpu_id()) {`
`482`	`482`	`return false;`
`483`	`483`	`}`
`484`	`484`	`for (const int token : req_tokens_[blob_name]) {`
Original file line number	Diff line number	Diff line change
`@@ -124,7 +124,7 @@ TEST(NetTest, DISABLED_ChainingForDifferentDevices) {`
`124`	`124`	`type: "NetTestDummy"`
`125`	`125`	`device_option {`
`126`	`126`	`device_type: 1`
`127`		`- device_id: 1`
	`127`	`+ cuda_gpu_id: 1`
`128`	`128`	`}`
`129`	`129`	`}`
`130`	`130`	`)DOC";`
Original file line number	Diff line number	Diff line change
`@@ -26,7 +26,7 @@ static vector<int64_t> GetMKLTensorInfo(`
`26`	`26`	`const mkl::MKLMemory<T>* tc = static_cast<const mkl::MKLMemory<T>*>(c);`
`27`	`27`	`*capacity = tc->size() * sizeof(T);`
`28`	`28`	`device->set_device_type(PROTO_MKLDNN);`
`29`		`- device->set_device_id(0);`
	`29`	`+ device->set_cuda_gpu_id(0);`
`30`	`30`	`return tc->dims();`
`31`	`31`	`}`
`32`	`32`
Original file line number	Diff line number	Diff line change
`@@ -65,7 +65,7 @@ caffe2::DeviceOption GetDeviceOption(const Device& onnx_device) {`
`65`	`65`	`{DeviceType::CUDA, caffe2::DeviceType::CUDA}};`
`66`	`66`	`caffe2::DeviceOption d;`
`67`	`67`	`d.set_device_type(static_cast<int32_t>(m.at(onnx_device.type)));`
`68`		`- d.set_device_id(onnx_device.device_id);`
	`68`	`+ d.set_cuda_gpu_id(onnx_device.device_id);`
`69`	`69`	`return d;`
`70`	`70`	`}`
`71`	`71`
Original file line number	Diff line number	Diff line change
`@@ -9,7 +9,7 @@ void LoadOp<CUDAContext>::SetCurrentDevice(BlobProto* proto) {`
`9`	`9`	`proto->mutable_tensor()->clear_device_detail();`
`10`	`10`	`auto* device_detail = proto->mutable_tensor()->mutable_device_detail();`
`11`	`11`	`device_detail->set_device_type(PROTO_CUDA);`
`12`		`- device_detail->set_device_id(CaffeCudaGetDevice());`
	`12`	`+ device_detail->set_cuda_gpu_id(CaffeCudaGetDevice());`
`13`	`13`	`}`
`14`	`14`	`}`
`15`	`15`