kevinch-nv
diff --git a/‎binaries/CMakeLists.txt
Lines changed: 4 additions & 4 deletions b/‎binaries/CMakeLists.txt
Lines changed: 4 additions & 4 deletions
diff --git a/‎caffe2/CMakeLists.txt
Lines changed: 2 additions & 3 deletions b/‎caffe2/CMakeLists.txt
Lines changed: 2 additions & 3 deletions
diff --git a/‎caffe2/core/CMakeLists.txt
Lines changed: 6 additions & 6 deletions b/‎caffe2/core/CMakeLists.txt
Lines changed: 6 additions & 6 deletions
diff --git a/‎caffe2/core/common_gpu.cc
Lines changed: 6 additions & 6 deletions b/‎caffe2/core/common_gpu.cc
Lines changed: 6 additions & 6 deletions
diff --git a/‎caffe2/core/common_gpu.h
Lines changed: 1 addition & 1 deletion b/‎caffe2/core/common_gpu.h
Lines changed: 1 addition & 1 deletion
diff --git a/‎caffe2/core/hip/common_miopen.cc renamed to ‎caffe2/core/hip/common_miopen.hip b/‎caffe2/core/hip/common_miopen.cc renamed to ‎caffe2/core/hip/common_miopen.hip
diff --git a/‎caffe2/core/hip/miopen_wrapper.h
Lines changed: 1 addition & 1 deletion b/‎caffe2/core/hip/miopen_wrapper.h
Lines changed: 1 addition & 1 deletion
diff --git a/‎caffe2/db/CMakeLists.txt
Lines changed: 2 additions & 2 deletions b/‎caffe2/db/CMakeLists.txt
Lines changed: 2 additions & 2 deletions
diff --git a/‎caffe2/image/CMakeLists.txt
Lines changed: 9 additions & 6 deletions b/‎caffe2/image/CMakeLists.txt
Lines changed: 9 additions & 6 deletions
diff --git a/‎caffe2/operators/CMakeLists.txt
Lines changed: 8 additions & 11 deletions b/‎caffe2/operators/CMakeLists.txt
Lines changed: 8 additions & 11 deletions
diff --git a/‎caffe2/operators/hip/activation_ops_miopen.h
Lines changed: 1 addition & 1 deletion b/‎caffe2/operators/hip/activation_ops_miopen.h
Lines changed: 1 addition & 1 deletion
diff --git a/‎caffe2/operators/hip/conv_op_miopen.cc renamed to ‎caffe2/operators/hip/conv_op_miopen.hip
Lines changed: 1 addition & 1 deletion b/‎caffe2/operators/hip/conv_op_miopen.cc renamed to ‎caffe2/operators/hip/conv_op_miopen.hip
Lines changed: 1 addition & 1 deletion
diff --git a/‎caffe2/operators/hip/conv_transpose_op_miopen.cc renamed to ‎caffe2/operators/hip/conv_transpose_op_miopen.hip
Lines changed: 1 addition & 1 deletion b/‎caffe2/operators/hip/conv_transpose_op_miopen.cc renamed to ‎caffe2/operators/hip/conv_transpose_op_miopen.hip
Lines changed: 1 addition & 1 deletion
diff --git a/‎caffe2/operators/hip/elu_op_miopen.cc renamed to ‎caffe2/operators/hip/elu_op_miopen.hip b/‎caffe2/operators/hip/elu_op_miopen.cc renamed to ‎caffe2/operators/hip/elu_op_miopen.hip
diff --git a/‎caffe2/operators/hip/local_response_normalization_op_miopen.cc renamed to ‎caffe2/operators/hip/local_response_normalization_op_miopen.hip
Lines changed: 1 addition & 1 deletion b/‎caffe2/operators/hip/local_response_normalization_op_miopen.cc renamed to ‎caffe2/operators/hip/local_response_normalization_op_miopen.hip
Lines changed: 1 addition & 1 deletion
diff --git a/‎caffe2/operators/hip/pool_op_miopen.cc renamed to ‎caffe2/operators/hip/pool_op_miopen.hip
Lines changed: 1 addition & 1 deletion b/‎caffe2/operators/hip/pool_op_miopen.cc renamed to ‎caffe2/operators/hip/pool_op_miopen.hip
Lines changed: 1 addition & 1 deletion
diff --git a/‎caffe2/operators/hip/relu_op_miopen.cc renamed to ‎caffe2/operators/hip/relu_op_miopen.hip b/‎caffe2/operators/hip/relu_op_miopen.cc renamed to ‎caffe2/operators/hip/relu_op_miopen.hip
diff --git a/‎caffe2/operators/hip/sigmoid_op_miopen.cc renamed to ‎caffe2/operators/hip/sigmoid_op_miopen.hip b/‎caffe2/operators/hip/sigmoid_op_miopen.cc renamed to ‎caffe2/operators/hip/sigmoid_op_miopen.hip
diff --git a/‎caffe2/operators/hip/spatial_batch_norm_op_miopen.cc renamed to ‎caffe2/operators/hip/spatial_batch_norm_op_miopen.hip
Lines changed: 2 additions & 2 deletions b/‎caffe2/operators/hip/spatial_batch_norm_op_miopen.cc renamed to ‎caffe2/operators/hip/spatial_batch_norm_op_miopen.hip
Lines changed: 2 additions & 2 deletions
diff --git a/‎caffe2/operators/hip/tanh_op_miopen.cc renamed to ‎caffe2/operators/hip/tanh_op_miopen.hip b/‎caffe2/operators/hip/tanh_op_miopen.cc renamed to ‎caffe2/operators/hip/tanh_op_miopen.hip
diff --git a/‎caffe2/operators/rnn/CMakeLists.txt
Lines changed: 18 additions & 2 deletions b/‎caffe2/operators/rnn/CMakeLists.txt
Lines changed: 18 additions & 2 deletions
diff --git a/‎caffe2/operators/rnn/hip/recurrent_op_miopen.h
Lines changed: 1 addition & 1 deletion b/‎caffe2/operators/rnn/hip/recurrent_op_miopen.h
Lines changed: 1 addition & 1 deletion
diff --git a/‎caffe2/operators/rnn/hip/recurrent_op_miopen.cc renamed to ‎caffe2/operators/rnn/hip/recurrent_op_miopen.hip b/‎caffe2/operators/rnn/hip/recurrent_op_miopen.cc renamed to ‎caffe2/operators/rnn/hip/recurrent_op_miopen.hip
diff --git a/‎caffe2/python/pybind_state_hip.cc
Lines changed: 2 additions & 2 deletions b/‎caffe2/python/pybind_state_hip.cc
Lines changed: 2 additions & 2 deletions
diff --git a/‎caffe2/queue/CMakeLists.txt
Lines changed: 6 additions & 4 deletions b/‎caffe2/queue/CMakeLists.txt
Lines changed: 6 additions & 4 deletions
@@ -24,13 +24,13 @@ if (USE_CUDA)
 endif()
 
 if (USE_ROCM)
-  caffe2_hip_binary_target("hip/inspect_hip.cc")
-  caffe2_hip_binary_target("hip/print_core_object_sizes_hip.cc")
+  caffe2_hip_binary_target("hip/inspect_gpu.cc")
+  caffe2_hip_binary_target("hip/print_core_object_sizes_gpu.cc")
 
   if (BUILD_TEST)
     # Core overhead benchmark
-    caffe2_hip_binary_target("hip/core_overhead_benchmark_hip.cc")
-    target_link_libraries(core_overhead_benchmark_hip benchmark)
+    caffe2_hip_binary_target("hip/core_overhead_benchmark_gpu.cc")
+    target_link_libraries(core_overhead_benchmark_gpu benchmark)
   endif()
 endif()
 
 
@@ -374,14 +374,14 @@ if(USE_ROCM)
   # Call again since Caffe2_HIP_INCLUDES is extended with ATen include dirs.
   hip_include_directories(${Caffe2_HIP_INCLUDES})
 
-  filter_list(__caffe2_hip_srcs_cpp Caffe2_HIP_SRCS "\\.(cc|cpp|cu)$")
+  filter_list(__caffe2_hip_srcs_cpp Caffe2_HIP_SRCS "\\.(cu|hip)$")
   set_source_files_properties(${__caffe2_hip_srcs_cpp} PROPERTIES HIP_SOURCE_PROPERTY_FORMAT 1)
 
   # FindHIP.CMake checks if the SHARED flag is set and adds extra logic accordingly.
   hip_add_library(caffe2_hip ${Caffe2_HIP_SRCS})
 
   # Since PyTorch files contain HIP headers, these flags are required for the necessary definitions to be added.
-  target_compile_options(caffe2_hip PRIVATE ${HIP_HCC_FLAGS})
+  target_compile_options(caffe2_hip PRIVATE ${HIP_CXX_FLAGS})
   target_link_libraries(caffe2_hip PUBLIC caffe2)
   target_link_libraries(caffe2_hip PUBLIC ${Caffe2_HIP_DEPENDENCY_LIBS})
 
@@ -435,7 +435,6 @@ if (BUILD_TEST)
 
   if(USE_ROCM)
     foreach(test_src ${Caffe2_HIP_TEST_SRCS})
-      set_source_files_properties(${test_src} PROPERTIES HIP_SOURCE_PROPERTY_FORMAT 1)
       get_filename_component(test_name ${test_src} NAME_WE)
       add_executable(${test_name} "${test_src}")
       target_link_libraries(${test_name} ${Caffe2_MAIN_LIBS} gtest_main)
 
@@ -14,14 +14,14 @@ set(Caffe2_GPU_SRCS ${Caffe2_GPU_SRCS} ${tmp})
 file(GLOB tmp *_test.cc)
 exclude(Caffe2_GPU_SRCS "${Caffe2_GPU_SRCS}" ${tmp})
 
-# ---[ HIP files
-file(GLOB_RECURSE tmp *_hip.cc)
+# ---[ general HIP files
+file(GLOB tmp hip/*.cc)
 set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} ${tmp})
-# ------[ MIOpen files
-file(GLOB_RECURSE tmp *_miopen.cc)
+# ------[ HIP sources
+file(GLOB tmp hip/*.hip)
 set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} ${tmp})
 # exclude test files
-file(GLOB_RECURSE tmp *_test.cc)
+file(GLOB tmp hip/*_test.cc)
 exclude(Caffe2_HIP_SRCS "${Caffe2_HIP_SRCS}" ${tmp})
 
 # ---[ CPU files.
@@ -42,7 +42,7 @@ file(GLOB tmp *_gpu_test.cc)
 set(Caffe2_GPU_TEST_SRCS ${Caffe2_GPU_TEST_SRCS} ${tmp})
 
 # ---[ HIP test files
-file(GLOB_RECURSE tmp *_hip_test.cc)
+file(GLOB tmp hip/*_test.cc)
 set(Caffe2_HIP_TEST_SRCS ${Caffe2_HIP_TEST_SRCS} ${tmp})
 
 # ---[ CPU test files
 
@@ -194,7 +194,7 @@ void DeviceQuery(const int device) {
      << std::endl;
   ss << "Total registers per block:     " << prop.regsPerBlock << std::endl;
   ss << "Warp size:                     " << prop.warpSize << std::endl;
-#ifndef __HIPCC__
+#ifndef __HIP_PLATFORM_HCC__
   ss << "Maximum memory pitch:          " << prop.memPitch << std::endl;
 #endif
   ss << "Maximum threads per block:     " << prop.maxThreadsPerBlock
@@ -207,14 +207,14 @@ void DeviceQuery(const int device) {
      << prop.maxGridSize[2] << std::endl;
   ss << "Clock rate:                    " << prop.clockRate << std::endl;
   ss << "Total constant memory:         " << prop.totalConstMem << std::endl;
-#ifndef __HIPCC__
+#ifndef __HIP_PLATFORM_HCC__
   ss << "Texture alignment:             " << prop.textureAlignment << std::endl;
   ss << "Concurrent copy and execution: "
      << (prop.deviceOverlap ? "Yes" : "No") << std::endl;
 #endif
   ss << "Number of multiprocessors:     " << prop.multiProcessorCount
      << std::endl;
-#ifndef __HIPCC__
+#ifndef __HIP_PLATFORM_HCC__
   ss << "Kernel execution timeout:      "
      << (prop.kernelExecTimeoutEnabled ? "Yes" : "No") << std::endl;
 #endif
@@ -266,7 +266,7 @@ const char* cublasGetErrorString(cublasStatus_t error) {
     return "CUBLAS_STATUS_INVALID_VALUE";
   case CUBLAS_STATUS_ARCH_MISMATCH:
     return "CUBLAS_STATUS_ARCH_MISMATCH";
-#ifndef __HIPCC__
+#ifndef __HIP_PLATFORM_HCC__
   case CUBLAS_STATUS_MAPPING_ERROR:
     return "CUBLAS_STATUS_MAPPING_ERROR";
   case CUBLAS_STATUS_EXECUTION_FAILED:
@@ -282,7 +282,7 @@ const char* cublasGetErrorString(cublasStatus_t error) {
     return "CUBLAS_STATUS_LICENSE_ERROR";
 #endif  // CUDA_VERSION >= 6050
 #endif  // CUDA_VERSION >= 6000
-#ifdef __HIPCC__
+#ifdef __HIP_PLATFORM_HCC__
   case rocblas_status_invalid_size:
     return "rocblas_status_invalid_size";
 #endif
@@ -319,7 +319,7 @@ const char* curandGetErrorString(curandStatus_t error) {
     return "CURAND_STATUS_ARCH_MISMATCH";
   case CURAND_STATUS_INTERNAL_ERROR:
     return "CURAND_STATUS_INTERNAL_ERROR";
-#ifdef __HIPCC__
+#ifdef __HIP_PLATFORM_HCC__
   case HIPRAND_STATUS_NOT_IMPLEMENTED:
     return "HIPRAND_STATUS_NOT_IMPLEMENTED";
 #endif
 
@@ -282,7 +282,7 @@ CAFFE2_CUDA_API const char* curandGetErrorString(curandStatus_t error);
 // CUDA_KERNEL_ASSERT is a macro that wraps an assert() call inside cuda
 // kernels. This is not supported by Apple platforms so we special case it.
 // See http://docs.nvidia.com/cuda/cuda-c-programming-guide/#assertion
-#if defined(__APPLE__) || defined(__HIPCC__)
+#if defined(__APPLE__) || defined(__HIP_PLATFORM_HCC__)
 #define CUDA_KERNEL_ASSERT(...)
 #else // __APPLE__
 #define CUDA_KERNEL_ASSERT(...) assert(__VA_ARGS__)
 
@@ -3,7 +3,7 @@
 #define CAFFE2_CORE_MIOPEN_WRAPPERS_H_
 
 #include "caffe2/core/hip/common_miopen.h"
-#include "caffe2/core/hip/context_hip.h"
+#include "caffe2/core/hip/context_gpu.h"
 
 namespace caffe2 {
 
 
@@ -6,13 +6,13 @@ set(Caffe2_DB_COMMON_GPU_SRC
     "${CMAKE_CURRENT_SOURCE_DIR}/create_db_op_gpu.cc"
 )
 set(Caffe2_DB_COMMON_HIP_SRC
-    "${CMAKE_CURRENT_SOURCE_DIR}/hip/create_db_op_hip.cc"
+    "${CMAKE_CURRENT_SOURCE_DIR}/hip/create_db_op_gpu.cc"
 )
 
 # Common files that are always going to be included.
 list(APPEND Caffe2_CPU_SRCS ${Caffe2_DB_COMMON_CPU_SRC})
 list(APPEND Caffe2_GPU_SRCS ${Caffe2_DB_COMMON_GPU_SRC})
-list(APPEND Caffe2_HIP_SRCS ${Caffe2_DB_COMMON_HIP_SRC}) 
+list(APPEND Caffe2_HIP_SRCS ${Caffe2_DB_COMMON_HIP_SRC})
 
 # DB specific files
 if (USE_LMDB)
 
@@ -12,13 +12,16 @@ if(USE_OPENCV AND OpenCV_FOUND)
   exclude(Caffe2_GPU_SRCS "${Caffe2_GPU_SRCS}" ${tmp})
 
   # ---[ HIP files
-  # ------[ general hip
-  file(GLOB_RECURSE tmp *_hip.cc)
+  # ------[ general HIP
+  file(GLOB tmp hip/*.cc)
+  set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} ${tmp})
+  # ------[ HIP sources
+  file(GLOB tmp hip/*.hip)
   set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} ${tmp})
   # exclude test files
-  file(GLOB_RECURSE tmp *_test.cc)
+  file(GLOB tmp hip/*_test.cc)
   exclude(Caffe2_HIP_SRCS "${Caffe2_HIP_SRCS}" ${tmp})
-  
+
   # ---[ CPU files.
   file(GLOB tmp *.cc)
   set(Caffe2_CPU_SRCS ${Caffe2_CPU_SRCS} ${tmp})
@@ -33,9 +36,9 @@ if(USE_OPENCV AND OpenCV_FOUND)
   set(Caffe2_GPU_TEST_SRCS ${Caffe2_GPU_TEST_SRCS} ${tmp})
 
   # ---[ HIP test files
-  file(GLOB_RECURSE tmp *_hip_test.cc)
+  file(GLOB tmp hip/*_test.cc)
   set(Caffe2_HIP_TEST_SRCS ${Caffe2_HIP_TEST_SRCS} ${tmp})
-  
+
   # ---[ CPU test files
   file(GLOB tmp *_test.cc)
   set(Caffe2_CPU_TEST_SRCS ${Caffe2_CPU_TEST_SRCS} ${tmp})
 
@@ -23,15 +23,15 @@ set(Caffe2_GPU_SRCS ${Caffe2_GPU_SRCS} ${tmp})
 file(GLOB tmp *_test.cc)
 exclude(Caffe2_GPU_SRCS "${Caffe2_GPU_SRCS}" ${tmp})
 
-# ------[ HIP sources
-file(GLOB_RECURSE tmp *_hip.cc)
-set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} ${tmp})
-# ------[ HIP device sources
-file(GLOB_RECURSE tmp *_hipdev.cc)
+# ------[ general HIP
+file(GLOB tmp hip/*.cc)
 set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} ${tmp})
-# ---[ MIOPEN files
-file(GLOB_RECURSE tmp *_miopen.cc)
+# ------[ HIP sources
+file(GLOB tmp hip/*.hip)
 set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} ${tmp})
+# exclude test files
+file(GLOB tmp hip/*_test.cc)
+exclude(Caffe2_HIP_SRCS "${Caffe2_HIP_SRCS}" ${tmp})
 
 # ---[ CPU files.
 file(GLOB tmp *.cc)
@@ -58,10 +58,7 @@ file(GLOB tmp *_gpu_test.cc)
 set(Caffe2_GPU_TEST_SRCS ${Caffe2_GPU_TEST_SRCS} ${tmp})
 
 # ---[ HIP test files
-file(GLOB_RECURSE tmp *_hip_test.cc)
-set(Caffe2_HIP_TEST_SRCS ${Caffe2_HIP_TEST_SRCS} ${tmp})
-# ---[ MIOPEN test files
-file(GLOB_RECURSE tmp *_miopen_test.cc)
+file(GLOB tmp hip/*_test.cc)
 set(Caffe2_HIP_TEST_SRCS ${Caffe2_HIP_TEST_SRCS} ${tmp})
 
 # ---[ CPU test files
 
@@ -1,7 +1,7 @@
 #ifndef CAFFE2_OPERATORS_ACTIVATION_OPS_MIOPEN_H_
 #define CAFFE2_OPERATORS_ACTIVATION_OPS_MIOPEN_H_
 
-#include "caffe2/core/hip/context_hip.h"
+#include "caffe2/core/hip/context_gpu.h"
 #include "caffe2/core/hip/miopen_wrapper.h"
 #include "caffe2/core/operator.h"
 #include "caffe2/core/tensor.h"
 
@@ -14,7 +14,7 @@
  * limitations under the License.
  */
 
-#include "caffe2/core/hip/context_hip.h"
+#include "caffe2/core/hip/context_gpu.h"
 #include "caffe2/core/hip/miopen_wrapper.h"
 #include "caffe2/operators/conv_op.h"
 #include "caffe2/operators/conv_pool_op_base.h"
 
@@ -1,4 +1,4 @@
-#include "caffe2/core/hip/context_hip.h"
+#include "caffe2/core/hip/context_gpu.h"
 #include "caffe2/core/hip/miopen_wrapper.h"
 #include "caffe2/operators/conv_transpose_op.h"
 
 
@@ -13,7 +13,7 @@
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
-#include "caffe2/core/hip/context_hip.h"
+#include "caffe2/core/hip/context_gpu.h"
 #include "caffe2/core/hip/miopen_wrapper.h"
 #include "caffe2/core/operator.h"
 #include "caffe2/core/types.h"
 
@@ -14,7 +14,7 @@
  * limitations under the License.
  */
 
-#include "caffe2/core/hip/context_hip.h"
+#include "caffe2/core/hip/context_gpu.h"
 #include "caffe2/core/hip/miopen_wrapper.h"
 #include "caffe2/operators/conv_pool_op_base.h"
 
 
@@ -15,10 +15,10 @@
  */
 
 #include <cfloat>
-#include "caffe2/core/hip/context_hip.h"
+#include "caffe2/core/hip/context_gpu.h"
 #include "caffe2/core/hip/miopen_wrapper.h"
 #include "caffe2/operators/spatial_batch_norm_op.h"
-#include "caffe2/operators/hip/spatial_batch_norm_op_hip_impl.cuh"
+#include "caffe2/operators/hip/spatial_batch_norm_op_gpu_impl.cuh"
 #include "caffe2/utils/math.h"
 
 const double MIOPEN_BN_MIN_EPSILON = 1e-6;
 
@@ -14,6 +14,16 @@ set(Caffe2_GPU_SRCS ${Caffe2_GPU_SRCS} ${tmp})
 file(GLOB tmp *_test.cc)
 exclude(Caffe2_GPU_SRCS "${Caffe2_GPU_SRCS}" ${tmp})
 
+# ------[ general HIP
+file(GLOB tmp hip/*.cc)
+set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} ${tmp})
+# ------[ HIP sources
+file(GLOB tmp hip/*.hip)
+set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} ${tmp})
+# exclude test files
+file(GLOB tmp hip/*_test.cc)
+exclude(Caffe2_HIP_SRCS "${Caffe2_HIP_SRCS}" ${tmp})
+
 # ---[ CPU files.
 file(GLOB tmp *.cc)
 # Manually remove the cudnn files since we might be using USE_CUDNN=OFF
@@ -24,7 +34,7 @@ set(Caffe2_CPU_SRCS ${Caffe2_CPU_SRCS} ${tmp})
 # exclude test files and gpu files
 file(GLOB tmp *_test.cc)
 exclude(Caffe2_CPU_SRCS "${Caffe2_CPU_SRCS}" ${tmp})
-exclude(Caffe2_CPU_SRCS "${Caffe2_CPU_SRCS}" ${Caffe2_GPU_SRCS})
+exclude(Caffe2_CPU_SRCS "${Caffe2_CPU_SRCS}" ${Caffe2_GPU_SRCS} ${Caffe2_HIP_SRCS})
 
 # ---[ GPU test files
 # ------[ cuDNN
@@ -36,13 +46,19 @@ endif()
 file(GLOB tmp *_gpu_test.cc)
 set(Caffe2_GPU_TEST_SRCS ${Caffe2_GPU_TEST_SRCS} ${tmp})
 
+# ------[ HIP test files
+file(GLOB tmp hip/*_test.cc)
+set(Caffe2_HIP_TEST_SRCS ${Caffe2_HIP_TEST_SRCS} ${tmp})
+
 # ---[ CPU test files
 file(GLOB tmp *_test.cc)
 set(Caffe2_CPU_TEST_SRCS ${Caffe2_CPU_TEST_SRCS} ${tmp})
-exclude(Caffe2_CPU_TEST_SRCS "${Caffe2_CPU_TEST_SRCS}" ${Caffe2_GPU_TEST_SRCS})
+exclude(Caffe2_CPU_TEST_SRCS "${Caffe2_CPU_TEST_SRCS}" ${Caffe2_GPU_TEST_SRCS} ${Caffe2_HIP_TEST_SRCS})
 
 # ---[ Send the lists to the parent scope.
 set(Caffe2_CPU_SRCS ${Caffe2_CPU_SRCS} PARENT_SCOPE)
 set(Caffe2_GPU_SRCS ${Caffe2_GPU_SRCS} PARENT_SCOPE)
+set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} PARENT_SCOPE)
 set(Caffe2_CPU_TEST_SRCS ${Caffe2_CPU_TEST_SRCS} PARENT_SCOPE)
 set(Caffe2_GPU_TEST_SRCS ${Caffe2_GPU_TEST_SRCS} PARENT_SCOPE)
+set(Caffe2_HIP_TEST_SRCS ${Caffe2_HIP_TEST_SRCS} PARENT_SCOPE)
@@ -2,7 +2,7 @@
 #define CAFFE2_OPERATORS_RECURRENT_OP_MIOPEN_H_
 
 #include "caffe2/core/context.h"
-#include "caffe2/core/hip/context_hip.h"
+#include "caffe2/core/hip/context_gpu.h"
 #include "caffe2/core/hip/miopen_wrapper.h"
 #include "caffe2/core/logging.h"
 #include "caffe2/core/operator.h"
 
@@ -6,8 +6,8 @@
 #include <pybind11/stl.h>
 
 #include "caffe2/core/hip/common_miopen.h"
-#include "caffe2/core/hip/context_hip.h"
-#include "caffe2/operators/hip/operator_fallback_hip.h"
+#include "caffe2/core/hip/context_gpu.h"
+#include "caffe2/operators/hip/operator_fallback_gpu.h"
 #include "caffe2/python/pybind_state_registry.h"
 
 namespace caffe2 {
 
@@ -9,11 +9,14 @@ set(Caffe2_GPU_SRCS ${Caffe2_GPU_SRCS} ${tmp})
 file(GLOB tmp *_test.cc)
 exclude(Caffe2_GPU_SRCS "${Caffe2_GPU_SRCS}" ${tmp})
 
+# ------[ general HIP
+file(GLOB tmp hip/*.cc)
+set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} ${tmp})
 # ---[ HIP files.
-file(GLOB_RECURSE tmp *_hip.cc)
+file(GLOB tmp hip/*.hip)
 set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} ${tmp})
 # exclude test files
-file(GLOB tmp *_test.cc)
+file(GLOB tmp hip/*_test.cc)
 exclude(Caffe2_HIP_SRCS "${Caffe2_HIP_SRCS}" ${tmp})
 
 # ---[ CPU files.
@@ -29,7 +32,7 @@ file(GLOB tmp *_gpu_test.cc)
 set(Caffe2_GPU_TEST_SRCS ${Caffe2_GPU_TEST_SRCS} ${tmp})
 
 # ---[ HIP test files
-file(GLOB_RECURSE tmp *_hip_test.cc)
+file(GLOB tmp hip/*_test.cc)
 set(Caffe2_HIP_TEST_SRCS ${Caffe2_HIP_TEST_SRCS} ${tmp})
 
 # ---[ CPU test files
@@ -44,4 +47,3 @@ set(Caffe2_HIP_SRCS ${Caffe2_HIP_SRCS} PARENT_SCOPE)
 set(Caffe2_CPU_TEST_SRCS ${Caffe2_CPU_TEST_SRCS} PARENT_SCOPE)
 set(Caffe2_GPU_TEST_SRCS ${Caffe2_GPU_TEST_SRCS} PARENT_SCOPE)
 set(Caffe2_HIP_TEST_SRCS ${Caffe2_HIP_TEST_SRCS} PARENT_SCOPE)
-
Original file line number	Diff line number	Diff line change
`@@ -6,13 +6,13 @@ set(Caffe2_DB_COMMON_GPU_SRC`
`6`	`6`	`"${CMAKE_CURRENT_SOURCE_DIR}/create_db_op_gpu.cc"`
`7`	`7`	`)`
`8`	`8`	`set(Caffe2_DB_COMMON_HIP_SRC`
`9`		`- "${CMAKE_CURRENT_SOURCE_DIR}/hip/create_db_op_hip.cc"`
	`9`	`+ "${CMAKE_CURRENT_SOURCE_DIR}/hip/create_db_op_gpu.cc"`
`10`	`10`	`)`
`11`	`11`
`12`	`12`	`# Common files that are always going to be included.`
`13`	`13`	`list(APPEND Caffe2_CPU_SRCS ${Caffe2_DB_COMMON_CPU_SRC})`
`14`	`14`	`list(APPEND Caffe2_GPU_SRCS ${Caffe2_DB_COMMON_GPU_SRC})`
`15`		`-list(APPEND Caffe2_HIP_SRCS ${Caffe2_DB_COMMON_HIP_SRC})`
	`15`	`+list(APPEND Caffe2_HIP_SRCS ${Caffe2_DB_COMMON_HIP_SRC})`
`16`	`16`
`17`	`17`	`# DB specific files`
`18`	`18`	`if (USE_LMDB)`
Original file line number	Diff line number	Diff line change
`@@ -1,4 +1,4 @@`
`1`		`-#include "caffe2/core/hip/context_hip.h"`
	`1`	`+#include "caffe2/core/hip/context_gpu.h"`
`2`	`2`	`#include "caffe2/core/hip/miopen_wrapper.h"`
`3`	`3`	`#include "caffe2/operators/conv_transpose_op.h"`
`4`	`4`