Review fix

JanuszL · JanuszL · commit 74a6e5a3cdfa · 2024-06-04T15:44:20.000+02:00
Signed-off-by: Janusz Lisiecki <jlisiecki@nvidia.com>
diff --git a/docs/examples/custom_operations/custom_operator/create_a_custom_operator.ipynb b/docs/examples/custom_operations/custom_operator/create_a_custom_operator.ipynb
@@ -43,47 +43,47 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "#ifndef EXAMPLE_DUMMY_H_\r\n",
-      "#define EXAMPLE_DUMMY_H_\r\n",
-      "\r\n",
-      "#include <vector>\r\n",
-      "\r\n",
-      "#include \"dali/pipeline/operator/operator.h\"\r\n",
-      "\r\n",
-      "namespace other_ns {\r\n",
-      "\r\n",
-      "template <typename Backend>\r\n",
-      "class Dummy : public ::dali::Operator<Backend> {\r\n",
-      " public:\r\n",
-      "  inline explicit Dummy(const ::dali::OpSpec &spec) :\r\n",
-      "    ::dali::Operator<Backend>(spec) {}\r\n",
-      "\r\n",
-      "  virtual inline ~Dummy() = default;\r\n",
-      "\r\n",
-      "  Dummy(const Dummy&) = delete;\r\n",
-      "  Dummy& operator=(const Dummy&) = delete;\r\n",
-      "  Dummy(Dummy&&) = delete;\r\n",
-      "  Dummy& operator=(Dummy&&) = delete;\r\n",
-      "\r\n",
-      " protected:\r\n",
-      "  bool CanInferOutputs() const override {\r\n",
-      "    return true;\r\n",
-      "  }\r\n",
-      "\r\n",
-      "  bool SetupImpl(std::vector<::dali::OutputDesc> &output_desc,\r\n",
-      "                 const ::dali::Workspace &ws) override {\r\n",
-      "    const auto &input = ws.Input<Backend>(0);\r\n",
-      "    output_desc.resize(1);\r\n",
-      "    output_desc[0] = {input.shape(), input.type()};\r\n",
-      "    return true;\r\n",
-      "  }\r\n",
-      "\r\n",
-      "  void RunImpl(::dali::Workspace &ws) override;\r\n",
-      "};\r\n",
-      "\r\n",
-      "}  // namespace other_ns\r\n",
-      "\r\n",
-      "#endif  // EXAMPLE_DUMMY_H_\r\n"
+      "#ifndef EXAMPLE_DUMMY_H_\n",
+      "#define EXAMPLE_DUMMY_H_\n",
+      "\n",
+      "#include <vector>\n",
+      "\n",
+      "#include \"dali/pipeline/operator/operator.h\"\n",
+      "\n",
+      "namespace other_ns {\n",
+      "\n",
+      "template <typename Backend>\n",
+      "class Dummy : public ::dali::Operator<Backend> {\n",
+      " public:\n",
+      "  inline explicit Dummy(const ::dali::OpSpec &spec) :\n",
+      "    ::dali::Operator<Backend>(spec) {}\n",
+      "\n",
+      "  virtual inline ~Dummy() = default;\n",
+      "\n",
+      "  Dummy(const Dummy&) = delete;\n",
+      "  Dummy& operator=(const Dummy&) = delete;\n",
+      "  Dummy(Dummy&&) = delete;\n",
+      "  Dummy& operator=(Dummy&&) = delete;\n",
+      "\n",
+      " protected:\n",
+      "  bool CanInferOutputs() const override {\n",
+      "    return true;\n",
+      "  }\n",
+      "\n",
+      "  bool SetupImpl(std::vector<::dali::OutputDesc> &output_desc,\n",
+      "                 const ::dali::Workspace &ws) override {\n",
+      "    const auto &input = ws.Input<Backend>(0);\n",
+      "    output_desc.resize(1);\n",
+      "    output_desc[0] = {input.shape(), input.type()};\n",
+      "    return true;\n",
+      "  }\n",
+      "\n",
+      "  void RunImpl(::dali::Workspace &ws) override;\n",
+      "};\n",
+      "\n",
+      "}  // namespace other_ns\n",
+      "\n",
+      "#endif  // EXAMPLE_DUMMY_H_\n"
      ]
     }
    ],
@@ -115,40 +115,40 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "#include \"dummy.h\"\r\n",
-      "\r\n",
-      "namespace other_ns {\r\n",
-      "\r\n",
-      "template <>\r\n",
-      "void Dummy<::dali::CPUBackend>::RunImpl(::dali::Workspace &ws) {\r\n",
-      "  const auto &input = ws.Input<::dali::CPUBackend>(0);\r\n",
-      "  auto &output = ws.Output<::dali::CPUBackend>(0);\r\n",
-      "\r\n",
-      "  ::dali::TypeInfo type = input.type_info();\r\n",
-      "  auto &tp = ws.GetThreadPool();\r\n",
-      "  const auto &in_shape = input.shape();\r\n",
-      "  for (int sample_id = 0; sample_id < in_shape.num_samples(); sample_id++) {\r\n",
-      "    tp.AddWork(\r\n",
-      "        [&, sample_id](int thread_id) {\r\n",
-      "          type.Copy<::dali::CPUBackend, ::dali::CPUBackend>(\r\n",
-      "                            output.raw_mutable_tensor(sample_id),\r\n",
-      "                            input.raw_tensor(sample_id),\r\n",
-      "                            in_shape.tensor_size(sample_id), 0);\r\n",
-      "        },\r\n",
-      "        in_shape.tensor_size(sample_id));\r\n",
-      "  }\r\n",
-      "  tp.RunAll();\r\n",
-      "}\r\n",
-      "\r\n",
-      "}  // namespace other_ns\r\n",
-      "\r\n",
-      "DALI_REGISTER_OPERATOR(CustomDummy, ::other_ns::Dummy<::dali::CPUBackend>,\r\n",
-      "                       ::dali::CPU);\r\n",
-      "\r\n",
-      "DALI_SCHEMA(CustomDummy)\r\n",
-      "    .DocStr(\"Make a copy of the input tensor\")\r\n",
-      "    .NumInput(1)\r\n",
-      "    .NumOutput(1);\r\n"
+      "#include \"dummy.h\"\n",
+      "\n",
+      "namespace other_ns {\n",
+      "\n",
+      "template <>\n",
+      "void Dummy<::dali::CPUBackend>::RunImpl(::dali::Workspace &ws) {\n",
+      "  const auto &input = ws.Input<::dali::CPUBackend>(0);\n",
+      "  auto &output = ws.Output<::dali::CPUBackend>(0);\n",
+      "\n",
+      "  ::dali::TypeInfo type = input.type_info();\n",
+      "  auto &tp = ws.GetThreadPool();\n",
+      "  const auto &in_shape = input.shape();\n",
+      "  for (int sample_id = 0; sample_id < in_shape.num_samples(); sample_id++) {\n",
+      "    tp.AddWork(\n",
+      "        [&, sample_id](int thread_id) {\n",
+      "          type.Copy<::dali::CPUBackend, ::dali::CPUBackend>(\n",
+      "                            output.raw_mutable_tensor(sample_id),\n",
+      "                            input.raw_tensor(sample_id),\n",
+      "                            in_shape.tensor_size(sample_id), 0);\n",
+      "        },\n",
+      "        in_shape.tensor_size(sample_id));\n",
+      "  }\n",
+      "  tp.RunAll();\n",
+      "}\n",
+      "\n",
+      "}  // namespace other_ns\n",
+      "\n",
+      "DALI_REGISTER_OPERATOR(CustomDummy, ::other_ns::Dummy<::dali::CPUBackend>,\n",
+      "                       ::dali::CPU);\n",
+      "\n",
+      "DALI_SCHEMA(CustomDummy)\n",
+      "    .DocStr(\"Make a copy of the input tensor\")\n",
+      "    .NumInput(1)\n",
+      "    .NumOutput(1);\n"
      ]
     }
    ],
@@ -180,30 +180,30 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "#include <cuda_runtime_api.h>\r\n",
-      "#include \"dummy.h\"\r\n",
-      "\r\n",
-      "namespace other_ns {\r\n",
-      "\r\n",
-      "template<>\r\n",
-      "void Dummy<::dali::GPUBackend>::RunImpl(::dali::Workspace &ws) {\r\n",
-      "  const auto &input = ws.Input<::dali::GPUBackend>(0);\r\n",
-      "  const auto &shape = input.shape();\r\n",
-      "  auto &output = ws.Output<::dali::GPUBackend>(0);\r\n",
-      "  for (int sample_idx = 0; sample_idx < shape.num_samples(); sample_idx++) {\r\n",
-      "    CUDA_CALL(cudaMemcpyAsync(\r\n",
-      "            output.raw_mutable_tensor(sample_idx),\r\n",
-      "            input.raw_tensor(sample_idx),\r\n",
-      "            shape[sample_idx].num_elements() * input.type_info().size(),\r\n",
-      "            cudaMemcpyDeviceToDevice,\r\n",
-      "            ws.stream()));\r\n",
-      "  }\r\n",
-      "}\r\n",
-      "\r\n",
-      "}  // namespace other_ns\r\n",
-      "\r\n",
-      "DALI_REGISTER_OPERATOR(CustomDummy, ::other_ns::Dummy<::dali::GPUBackend>,\r\n",
-      "                       ::dali::GPU);\r\n"
+      "#include <cuda_runtime_api.h>\n",
+      "#include \"dummy.h\"\n",
+      "\n",
+      "namespace other_ns {\n",
+      "\n",
+      "template<>\n",
+      "void Dummy<::dali::GPUBackend>::RunImpl(::dali::Workspace &ws) {\n",
+      "  const auto &input = ws.Input<::dali::GPUBackend>(0);\n",
+      "  const auto &shape = input.shape();\n",
+      "  auto &output = ws.Output<::dali::GPUBackend>(0);\n",
+      "  for (int sample_idx = 0; sample_idx < shape.num_samples(); sample_idx++) {\n",
+      "    CUDA_CALL(cudaMemcpyAsync(\n",
+      "            output.raw_mutable_tensor(sample_idx),\n",
+      "            input.raw_tensor(sample_idx),\n",
+      "            shape[sample_idx].num_elements() * input.type_info().size(),\n",
+      "            cudaMemcpyDeviceToDevice,\n",
+      "            ws.stream()));\n",
+      "  }\n",
+      "}\n",
+      "\n",
+      "}  // namespace other_ns\n",
+      "\n",
+      "DALI_REGISTER_OPERATOR(CustomDummy, ::other_ns::Dummy<::dali::GPUBackend>,\n",
+      "                       ::dali::GPU);\n"
      ]
     }
    ],
@@ -239,7 +239,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "/home/jlisiecki/Dali/dali/compile/dali/python/nvidia/dali/include\n"
+      "/usr/local/lib/python3.8/dist-packages/nvidia/dali/include\n"
      ]
     }
    ],
@@ -256,7 +256,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "/home/jlisiecki/Dali/dali/compile/dali/python/nvidia/dali\n"
+      "/usr/local/lib/python3.8/dist-packages/nvidia/dali\n"
      ]
     }
    ],
@@ -273,7 +273,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "['-I/home/jlisiecki/Dali/dali/compile/dali/python/nvidia/dali/include', '-D_GLIBCXX_USE_CXX11_ABI=1']\n"
+      "['-I/usr/local/lib/python3.8/dist-packages/nvidia/dali/include', '-D_GLIBCXX_USE_CXX11_ABI=1']\n"
      ]
     }
    ],
@@ -290,7 +290,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "['-L/home/jlisiecki/Dali/dali/compile/dali/python/nvidia/dali', '-ldali']\n"
+      "['-L/usr/local/lib/python3.8/dist-packages/nvidia/dali', '-ldali']\n"
      ]
     }
    ],
@@ -317,42 +317,42 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "cmake_minimum_required(VERSION 3.10)\r\n",
-      "set(CMAKE_CUDA_ARCHITECTURES \"50;60;70;80;90\")\r\n",
-      "\r\n",
-      "project(custom_dummy_plugin LANGUAGES CUDA CXX C)\r\n",
-      "\r\n",
-      "set(CMAKE_CXX_STANDARD 17)\r\n",
-      "set(CMAKE_CXX_STANDARD_REQUIRED ON)\r\n",
-      "set(CMAKE_CXX_EXTENSIONS OFF)\r\n",
-      "set(CMAKE_C_STANDARD 11)\r\n",
-      "\r\n",
-      "# TODO(klecki): When the test container gets a CMake that supports C++17 as a proper option,\r\n",
-      "# swap those lines\r\n",
-      "# set(CMAKE_CUDA_STANDARD 17)\r\n",
-      "# set(CMAKE_CUDA_STANDARD_REQUIRED ON)\r\n",
-      "set(CMAKE_CUDA_FLAGS \"${CMAKE_CUDA_FLAGS} -std=c++17\")\r\n",
-      "\r\n",
-      "include_directories(SYSTEM \"${CMAKE_CUDA_TOOLKIT_INCLUDE_DIRECTORIES}\")\r\n",
-      "\r\n",
-      "execute_process(\r\n",
-      "        COMMAND python -c \"import nvidia.dali as dali; \\\r\n",
-      "                           print(dali.sysconfig.get_lib_dir())\"\r\n",
-      "        OUTPUT_VARIABLE DALI_LIB_DIR)\r\n",
-      "string(STRIP ${DALI_LIB_DIR} DALI_LIB_DIR)\r\n",
-      "\r\n",
-      "execute_process(\r\n",
-      "        COMMAND python -c \"import nvidia.dali as dali; print(\\\" \\\r\n",
-      "                          \\\".join(dali.sysconfig.get_compile_flags()))\"\r\n",
-      "        OUTPUT_VARIABLE DALI_COMPILE_FLAGS)\r\n",
-      "string(STRIP ${DALI_COMPILE_FLAGS} DALI_COMPILE_FLAGS)\r\n",
-      "\r\n",
-      "set(CMAKE_CXX_FLAGS \"${CMAKE_CXX_FLAGS} ${DALI_COMPILE_FLAGS} \")\r\n",
-      "set(CMAKE_CUDA_FLAGS \"${CMAKE_CUDA_FLAGS} ${DALI_COMPILE_FLAGS} \")\r\n",
-      "link_directories(\"${DALI_LIB_DIR}\")\r\n",
-      "\r\n",
-      "add_library(dali_customdummy SHARED dummy.cc dummy.cu)\r\n",
-      "target_link_libraries(dali_customdummy dali)\r\n"
+      "cmake_minimum_required(VERSION 3.10)\n",
+      "set(CMAKE_CUDA_ARCHITECTURES \"50;60;70;80;90\")\n",
+      "\n",
+      "project(custom_dummy_plugin LANGUAGES CUDA CXX C)\n",
+      "\n",
+      "set(CMAKE_CXX_STANDARD 17)\n",
+      "set(CMAKE_CXX_STANDARD_REQUIRED ON)\n",
+      "set(CMAKE_CXX_EXTENSIONS OFF)\n",
+      "set(CMAKE_C_STANDARD 11)\n",
+      "\n",
+      "# TODO(klecki): When the test container gets a CMake that supports C++17 as a proper option,\n",
+      "# swap those lines\n",
+      "# set(CMAKE_CUDA_STANDARD 17)\n",
+      "# set(CMAKE_CUDA_STANDARD_REQUIRED ON)\n",
+      "set(CMAKE_CUDA_FLAGS \"${CMAKE_CUDA_FLAGS} -std=c++17\")\n",
+      "\n",
+      "include_directories(SYSTEM \"${CMAKE_CUDA_TOOLKIT_INCLUDE_DIRECTORIES}\")\n",
+      "\n",
+      "execute_process(\n",
+      "        COMMAND python -c \"import nvidia.dali as dali; \\\n",
+      "                           print(dali.sysconfig.get_lib_dir())\"\n",
+      "        OUTPUT_VARIABLE DALI_LIB_DIR)\n",
+      "string(STRIP ${DALI_LIB_DIR} DALI_LIB_DIR)\n",
+      "\n",
+      "execute_process(\n",
+      "        COMMAND python -c \"import nvidia.dali as dali; print(\\\" \\\n",
+      "                          \\\".join(dali.sysconfig.get_compile_flags()))\"\n",
+      "        OUTPUT_VARIABLE DALI_COMPILE_FLAGS)\n",
+      "string(STRIP ${DALI_COMPILE_FLAGS} DALI_COMPILE_FLAGS)\n",
+      "\n",
+      "set(CMAKE_CXX_FLAGS \"${CMAKE_CXX_FLAGS} ${DALI_COMPILE_FLAGS} \")\n",
+      "set(CMAKE_CUDA_FLAGS \"${CMAKE_CUDA_FLAGS} ${DALI_COMPILE_FLAGS} \")\n",
+      "link_directories(\"${DALI_LIB_DIR}\")\n",
+      "\n",
+      "add_library(dali_customdummy SHARED dummy.cc dummy.cu)\n",
+      "target_link_libraries(dali_customdummy dali)\n"
      ]
     }
    ],
@@ -376,9 +376,9 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "-- The CUDA compiler identification is NVIDIA 12.5.40\n",
-      "-- The CXX compiler identification is GNU 12.3.0\n",
-      "-- The C compiler identification is GNU 12.3.0\n",
+      "-- The CUDA compiler identification is NVIDIA 12.4.131\n",
+      "-- The CXX compiler identification is GNU 9.4.0\n",
+      "-- The C compiler identification is GNU 9.4.0\n",
       "-- Detecting CUDA compiler ABI info\n",
       "-- Detecting CUDA compiler ABI info - done\n",
       "-- Check for working CUDA compiler: /usr/local/cuda/bin/nvcc - skipped\n",
@@ -394,9 +394,9 @@
       "-- Check for working C compiler: /usr/bin/cc - skipped\n",
       "-- Detecting C compile features\n",
       "-- Detecting C compile features - done\n",
-      "-- Configuring done (6.0s)\n",
+      "-- Configuring done (5.2s)\n",
       "-- Generating done (0.0s)\n",
-      "-- Build files have been written to: /home/jlisiecki/Dali/dali/docs/examples/custom_operations/custom_operator/customdummy/build\n",
+      "-- Build files have been written to: /dali/docs/examples/custom_operations/custom_operator/customdummy/build\n",
       "[ 33%] \u001b[32mBuilding CXX object CMakeFiles/dali_customdummy.dir/dummy.cc.o\u001b[0m\n",
       "[ 66%] \u001b[32mBuilding CUDA object CMakeFiles/dali_customdummy.dir/dummy.cu.o\u001b[0m\n",
       "[100%] \u001b[32m\u001b[1mLinking CXX shared library libdali_customdummy.so\u001b[0m\n",
@@ -428,7 +428,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "customdummy/build/libdali_customdummy.so\r\n"
+      "customdummy/build/libdali_customdummy.so\n"
      ]
     }
    ],
@@ -574,7 +574,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.10.12"
+   "version": "3.8.10"
   }
  },
  "nbformat": 4,