eb8680
diff --git a/.jenkins/pytorch/test.sh b/.jenkins/pytorch/test.sh
Lines changed: 1 addition & 0 deletions
diff --git a/CMakeLists.txt b/CMakeLists.txt
Lines changed: 1 addition & 4 deletions
diff --git a/caffe2/contrib/ideep/CMakeLists.txt b/caffe2/contrib/ideep/CMakeLists.txt
Lines changed: 8 additions & 8 deletions
diff --git a/caffe2/contrib/warpctc/ctc_op.cpp b/caffe2/contrib/warpctc/ctc_op.cpp
Lines changed: 2 additions & 2 deletions
diff --git a/caffe2/core/macros.h.in b/caffe2/core/macros.h.in
Lines changed: 2 additions & 1 deletion
diff --git a/caffe2/ideep/CMakeLists.txt b/caffe2/ideep/CMakeLists.txt
Lines changed: 8 additions & 8 deletions
diff --git a/caffe2/operators/atomic_ops.cc b/caffe2/operators/atomic_ops.cc
Lines changed: 2 additions & 2 deletions
diff --git a/caffe2/operators/distance_op.cc b/caffe2/operators/distance_op.cc
Lines changed: 2 additions & 2 deletions
diff --git a/caffe2/operators/stylizer_ops.cc b/caffe2/operators/stylizer_ops.cc
Lines changed: 2 additions & 2 deletions
diff --git a/caffe2/opt/optimize_ideep.cc b/caffe2/opt/optimize_ideep.cc
Lines changed: 3 additions & 3 deletions
diff --git a/caffe2/python/CMakeLists.txt b/caffe2/python/CMakeLists.txt
Lines changed: 7 additions & 13 deletions
diff --git a/caffe2/python/ideep/LRN_op_test.py b/caffe2/python/ideep/LRN_op_test.py
Lines changed: 1 addition & 1 deletion
diff --git a/caffe2/python/ideep/concat_split_op_test.py b/caffe2/python/ideep/concat_split_op_test.py
Lines changed: 1 addition & 1 deletion
diff --git a/caffe2/python/ideep/conv_op_test.py b/caffe2/python/ideep/conv_op_test.py
Lines changed: 1 addition & 1 deletion
@@ -109,6 +109,7 @@ test_aten() {
 
     ${SUDO} ln -s "$TORCH_LIB_PATH"/libc10* build/bin
     ${SUDO} ln -s "$TORCH_LIB_PATH"/libcaffe2* build/bin
+    ${SUDO} ln -s "$TORCH_LIB_PATH"/libmkldnn* build/bin
     ${SUDO} ln -s "$TORCH_LIB_PATH"/libnccl* build/bin
 
     ls build/bin
 
@@ -117,8 +117,6 @@ option(USE_TENSORRT "Using Nvidia TensorRT library" OFF)
 option(USE_ZMQ "Use ZMQ" OFF)
 option(USE_ZSTD "Use ZSTD" OFF)
 option(USE_MKLDNN "Use MKLDNN" OFF)
-option(USE_IDEEP "Use IDEEP interface in MKL BLAS" ON)
-option(USE_MKLML "Use MKLML interface in MKL BLAS" ON)
 option(USE_DISTRIBUTED "Use distributed" ON)
 cmake_dependent_option(
     USE_MPI "Use MPI for Caffe2. Only available if USE_DISTRIBUTED is on." ON
@@ -150,8 +148,7 @@ if (BUILD_ATEN_ONLY)
   set(USE_NNPACK OFF)
   set(USE_NUMPY OFF)
   set(USE_OPENCV OFF)
-  set(USE_IDEEP OFF)
-  set(USE_MKLML OFF)
+  set(USE_MKLDNN OFF)
   set(USE_DISTRIBUTED OFF)
   set(USE_LMDB OFF)
 endif()
 
@@ -1,20 +1,20 @@
-if(USE_MKL AND USE_IDEEP AND CAFFE2_COMPILER_SUPPORTS_AVX2_EXTENSIONS)
+if(CAFFE2_USE_MKLDNN)
   message(STATUS "Including IDEEP operators")
 
   # ---[ CPU files.
-  file(GLOB_RECURSE avx2_srcs *.cc)
+  file(GLOB_RECURSE tmp *.cc)
+  set(Caffe2_CPU_SRCS ${Caffe2_CPU_SRCS} ${tmp})
   # exclude test files and gpu files
   file(GLOB_RECURSE tmp *_test.cc)
-  exclude(avx2_srcs "${avx2_srcs}" ${tmp})
+  exclude(Caffe2_CPU_SRCS "${Caffe2_CPU_SRCS}" ${tmp})
 
-  add_library(Caffe2_ideep_operators OBJECT ${avx2_srcs})
-  add_dependencies(Caffe2_ideep_operators Caffe2_PROTO)
-  set_target_properties(Caffe2_ideep_operators PROPERTIES COMPILE_FLAGS "-mavx2")
+  # ---[ CPU test files - currently none but just to be safe
+  file(GLOB_RECURSE tmp *_test.cc)
+  set(Caffe2_CPU_TEST_SRCS ${Caffe2_CPU_TEST_SRCS} ${tmp})
 
   # ---[ Send the lists to the parent scope.
-  set(Caffe2_CPU_SRCS ${Caffe2_CPU_SRCS}
-      $<TARGET_OBJECTS:Caffe2_ideep_operators>)
   set(Caffe2_CPU_SRCS ${Caffe2_CPU_SRCS} PARENT_SCOPE)
+  set(Caffe2_CPU_TEST_SRCS ${Caffe2_CPU_TEST_SRCS} PARENT_SCOPE)
 else()
   message(STATUS "Excluding ideep operators as we are not using ideep")
 endif()
@@ -2,7 +2,7 @@
 #include "caffe2/core/context_gpu.h"
 #include "caffe2/core/operator.h"
 
-#ifdef CAFFE2_USE_IDEEP
+#ifdef CAFFE2_USE_MKLDNN
 #include <caffe2/ideep/operators/operator_fallback_ideep.h>
 #include <caffe2/ideep/utils/ideep_operator.h>
 #endif
@@ -25,7 +25,7 @@ REGISTER_CPU_OPERATOR(CTC, CTCOp<float, CPUContext>);
 OPERATOR_SCHEMA(CTC).NumInputs(3, 4).NumOutputs(2, 3);
 //    .EnforceInputOutputGradient({{0, 0}});
 
-#ifdef CAFFE2_USE_IDEEP
+#ifdef CAFFE2_USE_MKLDNN
 REGISTER_IDEEP_OPERATOR(CTC, IDEEPFallbackOp<CTCOp<float, CPUContext>>);
 #endif
 
 
@@ -40,7 +40,7 @@ static_assert(
 #cmakedefine CAFFE2_USE_GOOGLE_GLOG
 #cmakedefine CAFFE2_USE_LITE_PROTO
 #cmakedefine CAFFE2_USE_MKL
-#cmakedefine CAFFE2_USE_IDEEP
+#cmakedefine CAFFE2_USE_MKLDNN
 #cmakedefine CAFFE2_USE_NVTX
 #cmakedefine CAFFE2_USE_TRT
 #cmakedefine CAFFE2_DISABLE_NUMA
@@ -76,6 +76,7 @@ static_assert(
   {"USE_EIGEN_FOR_BLAS", "${CAFFE2_USE_EIGEN_FOR_BLAS}"}, \
   {"USE_LITE_PROTO", "${CAFFE2_USE_LITE_PROTO}"}, \
   {"USE_MKL", "${CAFFE2_USE_MKL}"}, \
+  {"USE_MKLDNN", "${CAFFE2_USE_MKLDNN}"}, \
   {"USE_NVTX", "${CAFFE2_USE_NVTX}"}, \
   {"USE_TRT", "${CAFFE2_USE_TRT}"}, \
   {"DISABLE_NUMA", "${CAFFE2_DISABLE_NUMA}"}, \
 
@@ -1,20 +1,20 @@
-if(USE_MKL AND USE_IDEEP AND CAFFE2_COMPILER_SUPPORTS_AVX2_EXTENSIONS)
+if(CAFFE2_USE_MKLDNN)
   message(STATUS "Including IDEEP operators")
 
   # ---[ CPU files.
-  file(GLOB_RECURSE avx2_srcs *.cc)
+  file(GLOB_RECURSE tmp *.cc)
+  set(Caffe2_CPU_SRCS ${Caffe2_CPU_SRCS} ${tmp})
   # exclude test files and gpu files
   file(GLOB_RECURSE tmp *_test.cc)
-  exclude(avx2_srcs "${avx2_srcs}" ${tmp})
+  exclude(Caffe2_CPU_SRCS "${Caffe2_CPU_SRCS}" ${tmp})
 
-  add_library(Caffe2_ideep_operators OBJECT ${avx2_srcs})
-  add_dependencies(Caffe2_ideep_operators Caffe2_PROTO)
-  set_target_properties(Caffe2_ideep_operators PROPERTIES COMPILE_FLAGS "-mavx2")
+  # ---[ CPU test files - currently none but just to be safe
+  file(GLOB_RECURSE tmp *_test.cc)
+  set(Caffe2_CPU_TEST_SRCS ${Caffe2_CPU_TEST_SRCS} ${tmp})
 
   # ---[ Send the lists to the parent scope.
-  set(Caffe2_CPU_SRCS ${Caffe2_CPU_SRCS}
-      $<TARGET_OBJECTS:Caffe2_ideep_operators>)
   set(Caffe2_CPU_SRCS ${Caffe2_CPU_SRCS} PARENT_SCOPE)
+  set(Caffe2_CPU_TEST_SRCS ${Caffe2_CPU_TEST_SRCS} PARENT_SCOPE)
 else()
   message(STATUS "Excluding ideep operators as we are not using ideep")
 endif()
@@ -2,7 +2,7 @@
 #include "caffe2/core/context.h"
 #include "caffe2/core/operator.h"
 
-#ifdef CAFFE2_USE_IDEEP
+#ifdef CAFFE2_USE_MKLDNN
 #include <caffe2/ideep/operators/operator_fallback_ideep.h>
 #include <caffe2/ideep/utils/ideep_operator.h>
 #endif
@@ -90,7 +90,7 @@ class CheckAtomicBoolOp final : public Operator<CPUContext> {
 REGISTER_CPU_OPERATOR(CreateMutex, CreateMutexOp);
 REGISTER_CPU_OPERATOR(AtomicFetchAdd, AtomicFetchAddOp);
 
-#ifdef CAFFE2_USE_IDEEP
+#ifdef CAFFE2_USE_MKLDNN
 REGISTER_IDEEP_OPERATOR(CreateMutex, IDEEPFallbackOp<CreateMutexOp, SkipIndices<0>>);
 #endif
 
 
@@ -1,6 +1,6 @@
 #include "caffe2/operators/distance_op.h"
 #include "caffe2/utils/eigen_utils.h"
-#ifdef CAFFE2_USE_IDEEP
+#ifdef CAFFE2_USE_MKLDNN
 #include <caffe2/ideep/operators/operator_fallback_ideep.h>
 #include <caffe2/ideep/utils/ideep_operator.h>
 #endif
@@ -400,7 +400,7 @@ REGISTER_CPU_OPERATOR(L1Distance, L1DistanceOp<float, CPUContext>);
 REGISTER_CPU_OPERATOR(
     L1DistanceGradient,
     L1DistanceGradientOp<float, CPUContext>);
-#ifdef CAFFE2_USE_IDEEP
+#ifdef CAFFE2_USE_MKLDNN
 REGISTER_IDEEP_OPERATOR(
     L1DistanceGradient,
     IDEEPFallbackOp<L1DistanceGradientOp<float, CPUContext>>);
 
@@ -2,7 +2,7 @@
 #include "caffe2/utils/cpu_neon.h"
 #include "caffe2/utils/math.h"
 
-#ifdef CAFFE2_USE_IDEEP
+#ifdef CAFFE2_USE_MKLDNN
 #include <caffe2/ideep/operators/operator_fallback_ideep.h>
 #include <caffe2/ideep/utils/ideep_operator.h>
 #endif
@@ -586,7 +586,7 @@ OPERATOR_SCHEMA(BRGNCHWCToPackedInt8BGRAStylizerDeprocess)
     .NumInputs(2)
     .NumOutputs(1);
 
-#ifdef CAFFE2_USE_IDEEP
+#ifdef CAFFE2_USE_MKLDNN
 REGISTER_IDEEP_OPERATOR(
     BRGNCHWCToPackedInt8BGRAStylizerDeprocess,
     IDEEPFallbackOp<BRGNCHWCToPackedInt8BGRAStylizerDeprocessOp, SkipIndices<0>>);
 
@@ -2,7 +2,7 @@
 #include "caffe2/opt/converter.h"
 #include "caffe2/opt/fusion.h"
 
-#ifdef CAFFE2_USE_IDEEP
+#ifdef CAFFE2_USE_MKLDNN
 #include "caffe2/ideep/ideep_utils.h"
 #endif
 
@@ -11,7 +11,7 @@ namespace opt {
 
 using namespace nom;
 
-#ifndef CAFFE2_USE_IDEEP
+#ifndef CAFFE2_USE_MKLDNN
 void OptimizeForIdeep(
     repr::NNModule* nn,
     caffe2::Workspace* ws,
@@ -440,7 +440,7 @@ void OptimizeForIdeep(
   setPoolingInferenceMode(nn);
 }
 
-#endif // CAFFE2_USE_IDEEP
+#endif // CAFFE2_USE_MKLDNN
 
 } // namespace opt
 } // namespace caffe2
@@ -6,6 +6,13 @@ set(Caffe2_CPU_PYTHON_SRCS
     "/pybind_state_registry.cc"
 )
 
+if(CAFFE2_USE_MKLDNN)
+  set(Caffe2_CPU_PYTHON_SRCS
+      ${Caffe2_CPU_PYTHON_SRCS}
+      "/pybind_state_ideep.cc"
+  )
+endif()
+
 # ---[ GPU files
 set(Caffe2_GPU_PYTHON_SRCS
     ${Caffe2_CPU_PYTHON_SRCS}
@@ -22,19 +29,6 @@ prepend(Caffe2_CPU_PYTHON_SRCS ${CMAKE_CURRENT_SOURCE_DIR} ${Caffe2_CPU_PYTHON_S
 prepend(Caffe2_GPU_PYTHON_SRCS ${CMAKE_CURRENT_SOURCE_DIR} ${Caffe2_GPU_PYTHON_SRCS})
 prepend(Caffe2_HIP_PYTHON_SRCS ${CMAKE_CURRENT_SOURCE_DIR} ${Caffe2_HIP_PYTHON_SRCS})
 
-
-# --[ Some special handling for ideep binding as we need to build with "-mavx2"
-if(USE_MKL AND USE_IDEEP AND CAFFE2_COMPILER_SUPPORTS_AVX2_EXTENSIONS)
-  file(GLOB_RECURSE ideep_srcs *_ideep.cc)
-  add_library(Caffe2_ideep_pybind OBJECT ${ideep_srcs})
-  add_dependencies(Caffe2_ideep_pybind Caffe2_PROTO)
-  set_target_properties(Caffe2_ideep_pybind PROPERTIES COMPILE_FLAGS "-mavx2")
-  set(Caffe2_CPU_PYTHON_SRCS
-      ${Caffe2_CPU_PYTHON_SRCS}
-      $<TARGET_OBJECTS:Caffe2_ideep_pybind>
-  )
-endif()
-
 set(Caffe2_CPU_PYTHON_SRCS ${Caffe2_CPU_PYTHON_SRCS} PARENT_SCOPE)
 set(Caffe2_GPU_PYTHON_SRCS ${Caffe2_GPU_PYTHON_SRCS} PARENT_SCOPE)
 set(Caffe2_HIP_PYTHON_SRCS ${Caffe2_HIP_PYTHON_SRCS} PARENT_SCOPE)
 
@@ -12,7 +12,7 @@
 import caffe2.python.ideep_test_util as mu
 
 
-@unittest.skipIf(not workspace.C.use_ideep, "No IDEEP support.")
+@unittest.skipIf(not workspace.C.use_mkldnn, "No MKLDNN support.")
 class LRNTest(hu.HypothesisTestCase):
     @given(input_channels=st.integers(1, 3),
            batch_size=st.integers(1, 3),
 
@@ -45,7 +45,7 @@ def _tensor_splits(draw, add_axis=False):
         )
 
 
-@unittest.skipIf(not workspace.C.use_ideep, "No IDEEP support.")
+@unittest.skipIf(not workspace.C.use_mkldnn, "No MKLDNN support.")
 class TestConcatSplitOps(hu.HypothesisTestCase):
     @given(tensor_splits=_tensor_splits(),
            **mu.gcs)
 
@@ -14,7 +14,7 @@
 import caffe2.python.ideep_test_util as mu
 
 
-@unittest.skipIf(not workspace.C.use_ideep, "No IDEEP support.")
+@unittest.skipIf(not workspace.C.use_mkldnn, "No MKLDNN support.")
 class ConvTest(hu.HypothesisTestCase):
     @given(stride=st.integers(1, 3),
            pad=st.integers(0, 3),
Original file line number	Diff line number	Diff line change
`@@ -45,7 +45,7 @@ def _tensor_splits(draw, add_axis=False):`
`45`	`45`	`)`
`46`	`46`
`47`	`47`
`48`		`-@unittest.skipIf(not workspace.C.use_ideep, "No IDEEP support.")`
	`48`	`+@unittest.skipIf(not workspace.C.use_mkldnn, "No MKLDNN support.")`
`49`	`49`	`class TestConcatSplitOps(hu.HypothesisTestCase):`
`50`	`50`	`@given(tensor_splits=_tensor_splits(),`
`51`	`51`	`**mu.gcs)`