Added doc and removed upImpl in poseExtractor

dabd713b · gineshidalgo99 · 99855c6a · dabd713b · dabd713b · dabd713b
7 changed file
--- a/.travis.yml
+++ b/.travis.yml
@@ -22,6 +22,11 @@ matrix:
  #   WITH_MKL: false
  include:
  # Ubuntu 16.04
+  # Ubuntu 16.04 - Default - CMake - CUDA
+  - os: linux
+    dist: xenial
+    env: NAME="U16-default-cmake-cuda8"
+    sudo: required
  # Ubuntu 16.04 - Python - CMake - CUDA
  - os: linux
    dist: xenial
@@ -37,15 +42,10 @@ matrix:
    dist: xenial
    env: NAME="U16-python-cmake-cpu" WITH_PYTHON=true WITH_CUDA=false
    sudo: required
-  # Ubuntu 16.04 - Default - CMake - CUDA
+  # Ubuntu 16.04 - Python - CMake - OpenCL
  - os: linux
    dist: xenial
-    env: NAME="U16-default-cmake-cuda8"
-    sudo: required
-  # Ubuntu 16.04 - Default - CMake - CPU
-  - os: linux
-    dist: xenial
-    env: NAME="U16-default-cmake-cpu" WITH_CUDA=false
+    env: NAME="U16-python-cmake-opencl" WITH_PYTHON=true WITH_CUDA=false WITH_OPEN_CL=true
    sudo: required
  # Ubuntu 16.04 - Python - CMake - CPU - Debug
  - os: linux
@@ -64,10 +64,10 @@ matrix:
    osx_image: xcode9.4 # xcode10.1 does not work with Python # Versions: https://docs.travis-ci.com/user/languages/objective-c#supported-xcode-versions
    env: NAME="OSX-python-cmake-cpu" WITH_CUDA=false WITH_PYTHON=true
    sudo: required
-  # Mac OSX - Default - CMake - CPU
+  # Mac OSX - Python - CMake - OpenCL
  - os: osx
    osx_image: xcode10.1 # Versions: https://docs.travis-ci.com/user/languages/objective-c#supported-xcode-versions
-    env: NAME="OSX-default-cmake-cpu" WITH_CUDA=false
+    env: NAME="OSX-default-cmake-opencl" WITH_CUDA=false WITH_OPEN_CL=true
    sudo: required
  # Mac OSX - Python - CMake - CPU - Debug
  - os: osx
@@ -79,10 +79,10 @@ matrix:
    osx_image: xcode9.4 # xcode10.1 does not work with Python # Versions: https://docs.travis-ci.com/user/languages/objective-c#supported-xcode-versions
    env: NAME="OSX-python-cmake-cpu-unity" WITH_CUDA=false WITH_PYTHON=true WITH_UNITY=true
    sudo: required
-  # Mac OSX - Default - CMake - OpenCL
+  # Mac OSX - Default - CMake - CPU
  - os: osx
    osx_image: xcode10.1 # Versions: https://docs.travis-ci.com/user/languages/objective-c#supported-xcode-versions
-    env: NAME="OSX-default-cmake-opencl" WITH_CUDA=false WITH_OPEN_CL=true
+    env: NAME="OSX-default-cmake-cpu" WITH_CUDA=false
    sudo: required

  # # TO-DO: To be implemented
@@ -92,6 +92,11 @@ matrix:
  #   env: NAME="W10-default-cmake-cuda8"

  # Ubuntu (others)
+  # Ubuntu 16.04 - Default - CMake - CPU
+  - os: linux
+    dist: xenial
+    env: NAME="U16-default-cmake-cpu" WITH_CUDA=false
+    sudo: required
  # Ubuntu 16.04 - Default - Make - CUDA
  - os: linux
    dist: xenial
@@ -103,11 +108,6 @@ matrix:
  #   dist: xenial
  #   env: NAME="U16-default-cmake-cpu-mkl" WITH_CUDA=false WITH_MKL=true
  #   sudo: required
-  # Ubuntu 16.04 - Default - CMake - OpenCL
-  - os: linux
-    dist: xenial
-    env: NAME="U16-default-cmake-opencl" WITH_CUDA=false WITH_OPEN_CL=true
-    sudo: required
  # # Ubuntu 16.04 - Python - CMake - OpenCL
  # - os: linux
  #   dist: xenial

--- a/README.md
+++ b/README.md
@@ -4,10 +4,10 @@

 -----------------

-|               |`Python (CUDA)`| `Python (CPU)`| `CUDA`        | `CPU`         | `Debug`       | `Unity`       |
-| :---:         | :---:         | :---:         | :---:         | :---:         | :---:         | :---:         |
+|                  |`Default Config`  |`CUDA (+Python)`  |`CPU (+Python)`   |`OpenCL (+Python)`| `Debug`          | `Unity`          |
+| :---:            | :---:            | :---:            | :---:            | :---:            | :---:            | :---:            |
 | **`Linux`**   | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/1)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/2)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/3)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/4)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/5)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/6)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) |
-| **`MacOS`**   | | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/7)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/8)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/9)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/10)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) |
+| **`MacOS`**   | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/7)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/7)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/8)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/9)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/10)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) | [![Status](https://travis-matrix-badges.herokuapp.com/repos/CMU-Perceptual-Computing-Lab/openpose/branches/master/11)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose) |
 <!-- | **`Windows`** | | | | | | -->
 <!--
 Note: Currently using [travis-matrix-badges](https://github.com/bjfish/travis-matrix-badges) vs. traditional [![Build Status](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose.svg?branch=master)](https://travis-ci.org/CMU-Perceptual-Computing-Lab/openpose)

--- a/doc/modules/calibration_module.md
+++ b/doc/modules/calibration_module.md
@@ -107,7 +107,7 @@ Examples:
 1. **VERY IMPORTANT NOTE**: If you want to re-run the extrinsic parameter calibration over the same intrinsic XML files (e.g., if you move the camera location, but you know the instrinsics are the same), you must manually re-set to `1 0 0 0  0 1 0 0  0 0 1 0` the camera matrix of each XML file that will be used for `--combine_cam0_extrinsics`.
 2. After intrinsics calibration, save undirtoted images for all the camera views:
 ```sh
-./build/examples/openpose/openpose.bin --num_gpu 0 --flir_camera --write_images ~/Desktop/extrinsics
+./build/examples/openpose/openpose.bin --num_gpu 0 --flir_camera --frame_undistort --write_images ~/Desktop/extrinsics
 ```
 3. Run the extrinsic calibration tool between each pair of close cameras. In this example:
 	- We assume camera 0 to the right, 1 in the middle-right, 2 in the middle-left, and 3 in the left.
@@ -151,3 +151,28 @@ Examples:
 If you plan to use the calibration tool without using OpenPose, you can manually save a video sequence of your desired camera into each of the camera image folders (i.e., in the above example, the `~/Desktop/intrinsics_0`, `~/Desktop/intrinsics_1`, etc. folders).

 If you wanna eventually run that camera with OpenPose, check [doc/modules/3d_reconstruction_module.md#using-a-different-camera-brand](./modules/3d_reconstruction_module.md#using-a-different-camera-brand).
+
+
+
+## Naming Convention for the Output Images
+The naming convention for the saved images is the following: `[%12d]_rendered[CAMERA_NUMBER_MINUS_1].png`, where `[CAMERA_NUMBER_MINUS_1]` is nothing for camera 0, `_1` for camera 1, `_2` for camera 2, etc. E.g., for 4 cameras:
+```
+000000000000_rendered.png
+000000000000_rendered_1.png
+000000000000_rendered_2.png
+000000000000_rendered_3.png
+000000000001_rendered.png
+000000000001_rendered_1.png
+000000000001_rendered_2.png
+000000000001_rendered_3.png
+[...]
+```
+
+OpenPose generates them with the base name `[%12d]_rendered`. Ideally, any other base number should work as long as the termination `[CAMERA_NUMBER_MINUS_1]` is kept consistent for all the camera views. E.g., you could call them also as follows (assuming 4 cameras):
+```
+a.png, a_1.png, a_2.png, a_3.png,
+b.png, b_1.png, b_2.png, b_3.png,
+etc.
+```
+
+Again, the critical step is to keep the file termination fixed as `_1`, `_2`, etc.
--- a/doc/modules/python_module.md
+++ b/doc/modules/python_module.md
@@ -13,6 +13,12 @@
 ## Introduction
 This module exposes a Python API for OpenPose. It is effectively a wrapper that replicates most of the functionality of the [op::Wrapper class](https://github.com/CMU-Perceptual-Computing-Lab/openpose/blob/master/include/openpose/wrapper/wrapper.hpp) and allows you to populate and retrieve data from the [op::Datum class](https://github.com/CMU-Perceptual-Computing-Lab/openpose/blob/master/include/openpose/core/datum.hpp) using standard Python and Numpy constructs.

+The Python API is analagous to the C++ function calls. You may find them in [python/openpose/openpose_python.cpp#L194](https://github.com/CMU-Perceptual-Computing-Lab/openpose/blob/master/python/openpose/openpose_python.cpp#L194).
+
+The Python API is rather simple: `op::Array<float>` and `cv::Mat` objects get casted to numpy arrays automatically. Every other data structure based on the standard library is automatically converted into Python objects. For example, an `std::vector<std::vector<float>>` would become `[[item, item], [item, item]]`, etc. We also provide a casting of `op::Rectangle` and `op::Point` which simply expose setter getter for [x, y, width, height], etc.
+
+
+


 ## Compatibility

--- a/include/openpose/pose/poseExtractorCaffe.hpp
+++ b/include/openpose/pose/poseExtractorCaffe.hpp
@@ -2,6 +2,12 @@
 #define OPENPOSE_POSE_POSE_EXTRACTOR_CAFFE_HPP

 #include <openpose/core/common.hpp>
+#include <openpose/net/bodyPartConnectorCaffe.hpp>
+#include <openpose/net/maximumCaffe.hpp>
+#include <openpose/net/netCaffe.hpp>
+#include <openpose/net/netOpenCv.hpp>
+#include <openpose/net/nmsCaffe.hpp>
+#include <openpose/net/resizeAndMergeCaffe.hpp>
 #include <openpose/pose/enumClasses.hpp>
 #include <openpose/pose/poseExtractorNet.hpp>

@@ -21,7 +27,7 @@ namespace op

        virtual ~PoseExtractorCaffe();

-        void netInitializationOnThread();
+        virtual void netInitializationOnThread();

        /**
         * @param poseNetOutput If it is not empty, OpenPose will not run its internal body pose estimation network
@@ -30,7 +36,7 @@ namespace op
         * modify the pose estimation flags to match the dimension of both elements (e.g., `--net_resolution`,
         * `--scale_number`, etc.).
         */
-        void forwardPass(
+        virtual void forwardPass(
            const std::vector<Array<float>>& inputNetData, const Point<int>& inputDataSize,
            const std::vector<double>& scaleInputToNetInputs = {1.f},
            const Array<float>& poseNetOutput = Array<float>{});
@@ -48,13 +54,28 @@ namespace op
        const float* getPoseGpuConstPtr() const;

    private:
-        // PIMPL idiom
-        // http://www.cppsamples.com/common-tasks/pimpl.html
-        struct ImplPoseExtractorCaffe;
-        std::unique_ptr<ImplPoseExtractorCaffe> upImpl;
+        // Used when increasing spNets
+        const PoseModel mPoseModel;
+        const int mGpuId;
+        const std::string mModelFolder;
+        const std::string mProtoTxtPath;
+        const std::string mCaffeModelPath;
+        const float mUpsamplingRatio;
+        const bool mEnableNet;
+        const bool mEnableGoogleLogging;
+        // General parameters
+        std::vector<std::shared_ptr<Net>> spNets;
+        std::shared_ptr<ResizeAndMergeCaffe<float>> spResizeAndMergeCaffe;
+        std::shared_ptr<NmsCaffe<float>> spNmsCaffe;
+        std::shared_ptr<BodyPartConnectorCaffe<float>> spBodyPartConnectorCaffe;
+        std::shared_ptr<MaximumCaffe<float>> spMaximumCaffe;
+        std::vector<std::vector<int>> mNetInput4DSizes;
+        // Init with thread
+        std::vector<std::shared_ptr<ArrayCpuGpu<float>>> spCaffeNetOutputBlobs;
+        std::shared_ptr<ArrayCpuGpu<float>> spHeatMapsBlob;
+        std::shared_ptr<ArrayCpuGpu<float>> spPeaksBlob;
+        std::shared_ptr<ArrayCpuGpu<float>> spMaximumPeaksBlob;

-        // PIMP requires DELETE_COPY & destructor, or extra code
-        // http://oliora.github.io/2015/12/29/pimpl-and-rule-of-zero.html
        DELETE_COPY(PoseExtractorCaffe);
    };
 }

--- a/scripts/travis/defaults.sh
+++ b/scripts/travis/defaults.sh
@@ -2,6 +2,7 @@

 # Set default environment variables
 set -e
+TRAVIS_OS_NAME=${TRAVIS_OS_NAME}
 WITH_CMAKE=${WITH_CMAKE:-true}
 WITH_PYTHON=${WITH_PYTHON:-false}
 WITH_CUDA=${WITH_CUDA:-true}
@@ -10,7 +11,6 @@ WITH_OPEN_CL=${WITH_OPEN_CL:-false}
 WITH_MKL=${WITH_MKL:-false}
 WITH_UNITY=${WITH_UNITY:-false}
 WITH_DEBUG=${WITH_DEBUG:-false}
-TRAVIS_OS_NAME=${TRAVIS_OS_NAME}

 # Examples should be run (Travis not compatible with GPU code)
 # if [[ $WITH_CMAKE == true ]] && [[ $WITH_PYTHON == true ]] && [[ $WITH_CUDA == false ]] && [[ $WITH_OPEN_CL == false ]] && [[ $WITH_MKL == false ]]; then

--- a/src/openpose/pose/poseExtractorCaffe.cpp
+++ b/src/openpose/pose/poseExtractorCaffe.cpp
 #include <limits> // std::numeric_limits
-#ifdef USE_CAFFE
-    #include <caffe/blob.hpp>
-#endif
 #include <openpose/gpu/cuda.hpp>
-#ifdef USE_OPENCL
-    #include <openpose/gpu/opencl.hcl>
-    #include <openpose/gpu/cl2.hpp>
-#endif
-#include <openpose/net/bodyPartConnectorCaffe.hpp>
-#include <openpose/net/maximumCaffe.hpp>
-#include <openpose/net/netCaffe.hpp>
-#include <openpose/net/netOpenCv.hpp>
-#include <openpose/net/nmsCaffe.hpp>
-#include <openpose/net/resizeAndMergeCaffe.hpp>
 #include <openpose/pose/poseParameters.hpp>
 #include <openpose/utilities/check.hpp>
 #include <openpose/utilities/fastMath.hpp>
@@ -25,52 +12,6 @@ namespace op
 {
    const bool TOP_DOWN_REFINEMENT = false; // Note: +5% acc 1 scale, -2% max acc setting

-    struct PoseExtractorCaffe::ImplPoseExtractorCaffe
-    {
-        #ifdef USE_CAFFE
-            // Used when increasing spNets
-            const PoseModel mPoseModel;
-            const int mGpuId;
-            const std::string mModelFolder;
-            const std::string mProtoTxtPath;
-            const std::string mCaffeModelPath;
-            const float mUpsamplingRatio;
-            const bool mEnableNet;
-            const bool mEnableGoogleLogging;
-            // General parameters
-            std::vector<std::shared_ptr<Net>> spNets;
-            std::shared_ptr<ResizeAndMergeCaffe<float>> spResizeAndMergeCaffe;
-            std::shared_ptr<NmsCaffe<float>> spNmsCaffe;
-            std::shared_ptr<BodyPartConnectorCaffe<float>> spBodyPartConnectorCaffe;
-            std::shared_ptr<MaximumCaffe<float>> spMaximumCaffe;
-            std::vector<std::vector<int>> mNetInput4DSizes;
-            // Init with thread
-            std::vector<std::shared_ptr<ArrayCpuGpu<float>>> spCaffeNetOutputBlobs;
-            std::shared_ptr<ArrayCpuGpu<float>> spHeatMapsBlob;
-            std::shared_ptr<ArrayCpuGpu<float>> spPeaksBlob;
-            std::shared_ptr<ArrayCpuGpu<float>> spMaximumPeaksBlob;
-
-            ImplPoseExtractorCaffe(
-                const PoseModel poseModel, const int gpuId, const std::string& modelFolder,
-                const std::string& protoTxtPath, const std::string& caffeModelPath,
-                const float upsamplingRatio, const bool enableNet, const bool enableGoogleLogging) :
-                mPoseModel{poseModel},
-                mGpuId{gpuId},
-                mModelFolder{modelFolder},
-                mProtoTxtPath{protoTxtPath},
-                mCaffeModelPath{caffeModelPath},
-                mUpsamplingRatio{upsamplingRatio},
-                mEnableNet{enableNet},
-                mEnableGoogleLogging{enableGoogleLogging},
-                spResizeAndMergeCaffe{std::make_shared<ResizeAndMergeCaffe<float>>()},
-                spNmsCaffe{std::make_shared<NmsCaffe<float>>()},
-                spBodyPartConnectorCaffe{std::make_shared<BodyPartConnectorCaffe<float>>()},
-                spMaximumCaffe{(TOP_DOWN_REFINEMENT ? std::make_shared<MaximumCaffe<float>>() : nullptr)}
-            {
-            }
-        #endif
-    };
-
    #ifdef USE_CAFFE
        std::vector<ArrayCpuGpu<float>*> arraySharedToPtr(
            const std::vector<std::shared_ptr<ArrayCpuGpu<float>>>& caffeNetOutputBlob)
@@ -171,18 +112,29 @@ namespace op
        const std::vector<HeatMapType>& heatMapTypes, const ScaleMode heatMapScaleMode, const bool addPartCandidates,
        const bool maximizePositives, const std::string& protoTxtPath, const std::string& caffeModelPath,
        const float upsamplingRatio, const bool enableNet, const bool enableGoogleLogging) :
-        PoseExtractorNet{poseModel, heatMapTypes, heatMapScaleMode, addPartCandidates, maximizePositives}
+        PoseExtractorNet{poseModel, heatMapTypes, heatMapScaleMode, addPartCandidates, maximizePositives},
+        mPoseModel{poseModel},
+        mGpuId{gpuId},
+        mModelFolder{modelFolder},
+        mProtoTxtPath{protoTxtPath},
+        mCaffeModelPath{caffeModelPath},
+        mUpsamplingRatio{upsamplingRatio},
+        mEnableNet{enableNet},
+        mEnableGoogleLogging{enableGoogleLogging}
        #ifdef USE_CAFFE
-        , upImpl{new ImplPoseExtractorCaffe{poseModel, gpuId, modelFolder, protoTxtPath, caffeModelPath,
-                 upsamplingRatio, enableNet, enableGoogleLogging}}
+            ,
+            spResizeAndMergeCaffe{std::make_shared<ResizeAndMergeCaffe<float>>()},
+            spNmsCaffe{std::make_shared<NmsCaffe<float>>()},
+            spBodyPartConnectorCaffe{std::make_shared<BodyPartConnectorCaffe<float>>()},
+            spMaximumCaffe{(TOP_DOWN_REFINEMENT ? std::make_shared<MaximumCaffe<float>>() : nullptr)}
        #endif
    {
        try
        {
            #ifdef USE_CAFFE
                // Layers parameters
-                upImpl->spBodyPartConnectorCaffe->setPoseModel(upImpl->mPoseModel);
-                upImpl->spBodyPartConnectorCaffe->setMaximizePositives(maximizePositives);
+                spBodyPartConnectorCaffe->setPoseModel(mPoseModel);
+                spBodyPartConnectorCaffe->setMaximizePositives(maximizePositives);
            #else
                UNUSED(poseModel);
                UNUSED(modelFolder);
@@ -213,24 +165,24 @@ namespace op
        try
        {
            #ifdef USE_CAFFE
-                if (upImpl->mEnableNet)
+                if (mEnableNet)
                {
                    // Logging
                    log("Starting initialization on thread.", Priority::Low, __LINE__, __FUNCTION__, __FILE__);
                    // Initialize Caffe net
                    addCaffeNetOnThread(
-                        upImpl->spNets, upImpl->spCaffeNetOutputBlobs, upImpl->mPoseModel, upImpl->mGpuId,
-                        upImpl->mModelFolder, upImpl->mProtoTxtPath, upImpl->mCaffeModelPath,
-                        upImpl->mEnableGoogleLogging);
+                        spNets, spCaffeNetOutputBlobs, mPoseModel, mGpuId,
+                        mModelFolder, mProtoTxtPath, mCaffeModelPath,
+                        mEnableGoogleLogging);
                    #ifdef USE_CUDA
                        cudaCheck(__LINE__, __FUNCTION__, __FILE__);
                    #endif
                }
                // Initialize blobs
-                upImpl->spHeatMapsBlob = {std::make_shared<ArrayCpuGpu<float>>(1,1,1,1)};
-                upImpl->spPeaksBlob = {std::make_shared<ArrayCpuGpu<float>>(1,1,1,1)};
+                spHeatMapsBlob = {std::make_shared<ArrayCpuGpu<float>>(1,1,1,1)};
+                spPeaksBlob = {std::make_shared<ArrayCpuGpu<float>>(1,1,1,1)};
                if (TOP_DOWN_REFINEMENT)
-                    upImpl->spMaximumPeaksBlob = {std::make_shared<ArrayCpuGpu<float>>(1,1,1,1)};
+                    spMaximumPeaksBlob = {std::make_shared<ArrayCpuGpu<float>>(1,1,1,1)};
                #ifdef USE_CUDA
                    cudaCheck(__LINE__, __FUNCTION__, __FILE__);
                #endif
@@ -260,7 +212,7 @@ namespace op
                if (inputNetData.size() != scaleInputToNetInputs.size())
                    error("Size(inputNetData) must be same than size(scaleInputToNetInputs).",
                          __LINE__, __FUNCTION__, __FILE__);
-                if (poseNetOutput.empty() != upImpl->mEnableNet)
+                if (poseNetOutput.empty() != mEnableNet)
                {
                    const std::string errorMsg = ". Either use OpenPose default network (`--body 1`) or fill the"
                        " `poseNetOutput` argument (only 1 of those 2, not both).";
@@ -274,18 +226,18 @@ namespace op

                // Resize std::vectors if required
                const auto numberScales = inputNetData.size();
-                upImpl->mNetInput4DSizes.resize(numberScales);
+                mNetInput4DSizes.resize(numberScales);

                // Process each image - Caffe deep network
-                if (upImpl->mEnableNet)
+                if (mEnableNet)
                {
-                    while (upImpl->spNets.size() < numberScales)
+                    while (spNets.size() < numberScales)
                        addCaffeNetOnThread(
-                            upImpl->spNets, upImpl->spCaffeNetOutputBlobs, upImpl->mPoseModel, upImpl->mGpuId,
-                            upImpl->mModelFolder, upImpl->mProtoTxtPath, upImpl->mCaffeModelPath, false);
+                            spNets, spCaffeNetOutputBlobs, mPoseModel, mGpuId,
+                            mModelFolder, mProtoTxtPath, mCaffeModelPath, false);

                    for (auto i = 0u ; i < inputNetData.size(); i++)
-                        upImpl->spNets.at(i)->forwardPass(inputNetData[i]);
+                        spNets.at(i)->forwardPass(inputNetData[i]);
                }
                // If custom network output
                else
@@ -296,9 +248,9 @@ namespace op
                              + std::to_string(inputNetData.size()) + " vs. " + std::to_string(1) + ").",
                              __LINE__, __FUNCTION__, __FILE__);
                    // Copy heatmap information
-                    upImpl->spCaffeNetOutputBlobs.clear();
+                    spCaffeNetOutputBlobs.clear();
                    const bool copyFromGpu = false;
-                    upImpl->spCaffeNetOutputBlobs.emplace_back(
+                    spCaffeNetOutputBlobs.emplace_back(
                        std::make_shared<ArrayCpuGpu<float>>(poseNetOutput, copyFromGpu));
                }
                // Reshape blobs if required
@@ -306,33 +258,33 @@ namespace op
                {
                    // Reshape blobs if required - For dynamic sizes (e.g., images of different aspect ratio)
                    const auto changedVectors = !vectorsAreEqual(
-                        upImpl->mNetInput4DSizes.at(i), inputNetData[i].getSize());
+                        mNetInput4DSizes.at(i), inputNetData[i].getSize());
                    if (changedVectors)
                    {
-                        upImpl->mNetInput4DSizes.at(i) = inputNetData[i].getSize();
+                        mNetInput4DSizes.at(i) = inputNetData[i].getSize();
                        reshapePoseExtractorCaffe(
-                            upImpl->spResizeAndMergeCaffe, upImpl->spNmsCaffe, upImpl->spBodyPartConnectorCaffe,
-                            upImpl->spMaximumCaffe, upImpl->spCaffeNetOutputBlobs, upImpl->spHeatMapsBlob,
-                            upImpl->spPeaksBlob, upImpl->spMaximumPeaksBlob, 1.f, upImpl->mPoseModel,
-                            upImpl->mGpuId, upImpl->mUpsamplingRatio);
+                            spResizeAndMergeCaffe, spNmsCaffe, spBodyPartConnectorCaffe,
+                            spMaximumCaffe, spCaffeNetOutputBlobs, spHeatMapsBlob,
+                            spPeaksBlob, spMaximumPeaksBlob, 1.f, mPoseModel,
+                            mGpuId, mUpsamplingRatio);
                            // In order to resize to input size to have same results as Matlab
                            // scaleInputToNetInputs[i] vs. 1.f
                    }
                    // Get scale net to output (i.e., image input)
                    const auto ratio = (
-                        upImpl->mUpsamplingRatio <= 0.f
-                            ? 1 : upImpl->mUpsamplingRatio / getPoseNetDecreaseFactor(mPoseModel));
+                        mUpsamplingRatio <= 0.f
+                            ? 1 : mUpsamplingRatio / getPoseNetDecreaseFactor(mPoseModel));
                    if (changedVectors || TOP_DOWN_REFINEMENT)
                        mNetOutputSize = Point<int>{
-                            positiveIntRound(ratio*upImpl->mNetInput4DSizes[0][3]),
-                            positiveIntRound(ratio*upImpl->mNetInput4DSizes[0][2])};
+                            positiveIntRound(ratio*mNetInput4DSizes[0][3]),
+                            positiveIntRound(ratio*mNetInput4DSizes[0][2])};
                }
                // 2. Resize heat maps + merge different scales
                // ~5ms (GPU) / ~20ms (CPU)
-                const auto caffeNetOutputBlobs = arraySharedToPtr(upImpl->spCaffeNetOutputBlobs);
+                const auto caffeNetOutputBlobs = arraySharedToPtr(spCaffeNetOutputBlobs);
                const std::vector<float> floatScaleRatios(scaleInputToNetInputs.begin(), scaleInputToNetInputs.end());
-                upImpl->spResizeAndMergeCaffe->setScaleRatios(floatScaleRatios);
-                upImpl->spResizeAndMergeCaffe->Forward(caffeNetOutputBlobs, {upImpl->spHeatMapsBlob.get()});
+                spResizeAndMergeCaffe->setScaleRatios(floatScaleRatios);
+                spResizeAndMergeCaffe->Forward(caffeNetOutputBlobs, {spHeatMapsBlob.get()});
                // Get scale net to output (i.e., image input)
                // Note: In order to resize to input size, (un)comment the following lines
                const auto scaleProducerToNetInput = resizeGetScaleFactor(inputDataSize, mNetOutputSize);
@@ -344,20 +296,20 @@ namespace op
                // 3. Get peaks by Non-Maximum Suppression
                // ~2ms (GPU) / ~7ms (CPU)
                const auto nmsThreshold = (float)get(PoseProperty::NMSThreshold);
-                upImpl->spNmsCaffe->setThreshold(nmsThreshold);
+                spNmsCaffe->setThreshold(nmsThreshold);
                const auto nmsOffset = float(0.5/double(mScaleNetToOutput));
-                upImpl->spNmsCaffe->setOffset(Point<float>{nmsOffset, nmsOffset});
-                upImpl->spNmsCaffe->Forward({upImpl->spHeatMapsBlob.get()}, {upImpl->spPeaksBlob.get()});
+                spNmsCaffe->setOffset(Point<float>{nmsOffset, nmsOffset});
+                spNmsCaffe->Forward({spHeatMapsBlob.get()}, {spPeaksBlob.get()});
                // 4. Connecting body parts
-                upImpl->spBodyPartConnectorCaffe->setScaleNetToOutput(mScaleNetToOutput);
-                upImpl->spBodyPartConnectorCaffe->setInterMinAboveThreshold(
+                spBodyPartConnectorCaffe->setScaleNetToOutput(mScaleNetToOutput);
+                spBodyPartConnectorCaffe->setInterMinAboveThreshold(
                    (float)get(PoseProperty::ConnectInterMinAboveThreshold));
-                upImpl->spBodyPartConnectorCaffe->setInterThreshold((float)get(PoseProperty::ConnectInterThreshold));
-                upImpl->spBodyPartConnectorCaffe->setMinSubsetCnt((int)get(PoseProperty::ConnectMinSubsetCnt));
-                upImpl->spBodyPartConnectorCaffe->setMinSubsetScore((float)get(PoseProperty::ConnectMinSubsetScore));
+                spBodyPartConnectorCaffe->setInterThreshold((float)get(PoseProperty::ConnectInterThreshold));
+                spBodyPartConnectorCaffe->setMinSubsetCnt((int)get(PoseProperty::ConnectMinSubsetCnt));
+                spBodyPartConnectorCaffe->setMinSubsetScore((float)get(PoseProperty::ConnectMinSubsetScore));
                // Note: BODY_25D will crash (only implemented for CPU version)
-                upImpl->spBodyPartConnectorCaffe->Forward(
-                    {upImpl->spHeatMapsBlob.get(), upImpl->spPeaksBlob.get()}, mPoseKeypoints, mPoseScores);
+                spBodyPartConnectorCaffe->Forward(
+                    {spHeatMapsBlob.get(), spPeaksBlob.get()}, mPoseKeypoints, mPoseScores);
                // Re-run on each person
                if (TOP_DOWN_REFINEMENT)
                {
@@ -450,46 +402,46 @@ namespace op

                            // Re-Process image
                            // 1. Caffe deep network
-                            upImpl->spNets.at(0)->forwardPass(inputNetDataRoi);
+                            spNets.at(0)->forwardPass(inputNetDataRoi);
                            std::vector<std::shared_ptr<ArrayCpuGpu<float>>> caffeNetOutputBlob{
-                                upImpl->spCaffeNetOutputBlobs[0]};
+                                spCaffeNetOutputBlobs[0]};
                            // Reshape blobs
-                            if (!vectorsAreEqual(upImpl->mNetInput4DSizes.at(0), inputNetDataRoi.getSize()))
+                            if (!vectorsAreEqual(mNetInput4DSizes.at(0), inputNetDataRoi.getSize()))
                            {
-                                upImpl->mNetInput4DSizes.at(0) = inputNetDataRoi.getSize();
+                                mNetInput4DSizes.at(0) = inputNetDataRoi.getSize();
                                reshapePoseExtractorCaffe(
-                                    upImpl->spResizeAndMergeCaffe, upImpl->spNmsCaffe,
-                                    upImpl->spBodyPartConnectorCaffe, upImpl->spMaximumCaffe,
-                                    // upImpl->spCaffeNetOutputBlobs,
-                                    caffeNetOutputBlob, upImpl->spHeatMapsBlob, upImpl->spPeaksBlob,
-                                    upImpl->spMaximumPeaksBlob, 1.f, upImpl->mPoseModel, upImpl->mGpuId,
-                                    upImpl->mUpsamplingRatio);
+                                    spResizeAndMergeCaffe, spNmsCaffe,
+                                    spBodyPartConnectorCaffe, spMaximumCaffe,
+                                    // spCaffeNetOutputBlobs,
+                                    caffeNetOutputBlob, spHeatMapsBlob, spPeaksBlob,
+                                    spMaximumPeaksBlob, 1.f, mPoseModel, mGpuId,
+                                    mUpsamplingRatio);
                            }
                            // 2. Resize heat maps + merge different scales
                            const auto caffeNetOutputBlobs = arraySharedToPtr(caffeNetOutputBlob);
                            // const std::vector<float> floatScaleRatios(
                            //     scaleInputToNetInputs.begin(), scaleInputToNetInputs.end());
                            const std::vector<float> floatScaleRatios{(float)scaleInputToNetInputs[0]};
-                            upImpl->spResizeAndMergeCaffe->setScaleRatios(floatScaleRatios);
-                            upImpl->spResizeAndMergeCaffe->Forward(
-                                caffeNetOutputBlobs, {upImpl->spHeatMapsBlob.get()});
+                            spResizeAndMergeCaffe->setScaleRatios(floatScaleRatios);
+                            spResizeAndMergeCaffe->Forward(
+                                caffeNetOutputBlobs, {spHeatMapsBlob.get()});
                            // Get scale net to output (i.e., image input)
                            const auto scaleRoiToOutput = float(mScaleNetToOutput / scaleNetToRoi);
                            // 3. Get peaks by Non-Maximum Suppression
                            const auto nmsThresholdRefined = 0.02f;
-                            upImpl->spNmsCaffe->setThreshold(nmsThresholdRefined);
+                            spNmsCaffe->setThreshold(nmsThresholdRefined);
                            const auto nmsOffset = float(0.5/double(scaleRoiToOutput));
-                            upImpl->spNmsCaffe->setOffset(Point<float>{nmsOffset, nmsOffset});
-                            upImpl->spNmsCaffe->Forward({upImpl->spHeatMapsBlob.get()}, {upImpl->spPeaksBlob.get()});
+                            spNmsCaffe->setOffset(Point<float>{nmsOffset, nmsOffset});
+                            spNmsCaffe->Forward({spHeatMapsBlob.get()}, {spPeaksBlob.get()});
                            // Define poseKeypoints
                            Array<float> poseKeypoints;
                            Array<float> poseScores;
                            // 4. Connecting body parts
                            // Get scale net to output (i.e., image input)
-                            upImpl->spBodyPartConnectorCaffe->setScaleNetToOutput(scaleRoiToOutput);
-                            upImpl->spBodyPartConnectorCaffe->setInterThreshold(0.01f);
-                            upImpl->spBodyPartConnectorCaffe->Forward(
-                                {upImpl->spHeatMapsBlob.get(), upImpl->spPeaksBlob.get()}, poseKeypoints, poseScores);
+                            spBodyPartConnectorCaffe->setScaleNetToOutput(scaleRoiToOutput);
+                            spBodyPartConnectorCaffe->setInterThreshold(0.01f);
+                            spBodyPartConnectorCaffe->Forward(
+                                {spHeatMapsBlob.get(), spPeaksBlob.get()}, poseKeypoints, poseScores);
                            // If detected people in new subnet
                            if (!poseKeypoints.empty())
                            {
@@ -603,10 +555,10 @@ namespace op
                                        //     if (!overlappingPerson)
                                        //     {
                                        //         // Get keypoint with maximum probability per channel
-                                        //         upImpl->spMaximumCaffe->Forward(
-                                        //             {upImpl->spHeatMapsBlob.get()}, {upImpl->spMaximumPeaksBlob.get()});
+                                        //         spMaximumCaffe->Forward(
+                                        //             {spHeatMapsBlob.get()}, {spMaximumPeaksBlob.get()});
                                        //         // Fill gaps
-                                        //         const auto* posePeaksPtr = upImpl->spMaximumPeaksBlob->mutable_cpu_data();
+                                        //         const auto* posePeaksPtr = spMaximumPeaksBlob->mutable_cpu_data();
                                        //         for (auto part = 0 ; part < mPoseKeypoints.getSize(1) ; part++)
                                        //         {
                                        //             // For currently empty keypoints
@@ -660,7 +612,7 @@ namespace op
        {
            #ifdef USE_CAFFE
                checkThread();
-                return upImpl->spPeaksBlob->cpu_data();
+                return spPeaksBlob->cpu_data();
            #else
                return nullptr;
            #endif
@@ -678,7 +630,7 @@ namespace op
        {
            #ifdef USE_CAFFE
                checkThread();
-                return upImpl->spPeaksBlob->gpu_data();
+                return spPeaksBlob->gpu_data();
            #else
                return nullptr;
            #endif
@@ -696,7 +648,7 @@ namespace op
        {
            #ifdef USE_CAFFE
                checkThread();
-                return upImpl->spHeatMapsBlob->cpu_data();
+                return spHeatMapsBlob->cpu_data();
            #else
                return nullptr;
            #endif
@@ -714,7 +666,7 @@ namespace op
        {
            #ifdef USE_CAFFE
                checkThread();
-                return upImpl->spHeatMapsBlob->gpu_data();
+                return spHeatMapsBlob->gpu_data();
            #else
                return nullptr;
            #endif
@@ -732,7 +684,7 @@ namespace op
        {
            #ifdef USE_CAFFE
                checkThread();
-                return upImpl->spHeatMapsBlob->shape();
+                return spHeatMapsBlob->shape();
            #else
                return {};
            #endif