Added source code

mp3guy · Oct 30, 2015 · 544da79 · 544da79
1 parent 0dbf2bf
commit 544da79
Show file tree

Hide file tree

Showing 120 changed files with 17,413 additions and 1 deletion.
diff --git a/.gitignore b/.gitignore
@@ -0,0 +1,4 @@
+build/
+deps/
+.project
+.cproject
diff --git a/Core/src/CMakeLists.txt b/Core/src/CMakeLists.txt
@@ -0,0 +1,53 @@
+cmake_minimum_required(VERSION 2.6.0)
+
+project(libefusion)
+
+set(CMAKE_MODULE_PATH ${CMAKE_MODULE_PATH} "${CMAKE_CURRENT_SOURCE_DIR}")
+
+find_package(Pangolin 0.1 REQUIRED)
+find_package(CUDA REQUIRED)
+find_package(SuiteSparse REQUIRED)
+
+set(efusion_SHADER_DIR "${CMAKE_CURRENT_SOURCE_DIR}/Shaders" CACHE PATH "Where the shaders live")
+
+include_directories(${Pangolin_INCLUDE_DIRS})
+include_directories(${CUDA_INCLUDE_DIRS})
+include_directories(${EIGEN_INCLUDE_DIRS})
+include_directories(${SUITESPARSE_INCLUDE_DIRS})
+
+file(GLOB srcs *.cpp)
+file(GLOB utils_srcs Utils/*.cpp)
+file(GLOB shader_srcs Shaders/*.cpp)
+file(GLOB cuda Cuda/*.cu)
+file(GLOB containers Cuda/containers/*.cpp)
+
+set(CUDA_ARCH_BIN "20 30 35 50 52" CACHE STRING "Specify 'real' GPU arch to build binaries for, BIN(PTX) format is supported. Example: 1.3 2.1(1.3) or 13 21(13)")
+set(CUDA_ARCH_PTX "" CACHE STRING "Specify 'virtual' PTX arch to build PTX intermediate code for. Example: 1.0 1.2 or 10 12")              
+
+SET(CMAKE_MODULE_PATH ${CMAKE_MODULE_PATH} ${CMAKE_CURRENT_SOURCE_DIR})
+include(CudaComputeTargetFlags.cmake)                  
+APPEND_TARGET_ARCH_FLAGS()
+
+set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS}  "-Xcompiler;-fPIC;")           
+set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} "--ftz=true;--prec-div=false;--prec-sqrt=false") 
+
+CUDA_COMPILE(cuda_objs ${cuda})
+
+set(CMAKE_CXX_FLAGS "-O3 -msse2 -msse3 -Wall -std=c++11 -DSHADER_DIR=${efusion_SHADER_DIR}")
+#set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -g -Wall -std=c++11 -DSHADER_DIR=${efusion_SHADER_DIR}")
+
+add_library(efusion SHARED 
+            ${srcs}
+            ${utils_srcs}
+            ${shader_srcs}
+            ${cuda} 
+            ${cuda_objs} 
+            ${containers}
+)
+
+target_link_libraries(efusion
+                      ${Eigen_LIBRARIES}
+                      ${Pangolin_LIBRARIES}
+                      ${CUDA_LIBRARIES}
+                      ${SUITESPARSE_LIBRARIES}
+)
diff --git a/Core/src/Cuda/containers/device_array.hpp b/Core/src/Cuda/containers/device_array.hpp
@@ -0,0 +1,257 @@
+/*
+ * Software License Agreement (BSD License)
+ *
+ *  Copyright (c) 2011, Willow Garage, Inc.
+ *  All rights reserved.
+ *
+ *  Redistribution and use in source and binary forms, with or without
+ *  modification, are permitted provided that the following conditions
+ *  are met:
+ *
+ *   * Redistributions of source code must retain the above copyright
+ *     notice, this list of conditions and the following disclaimer.
+ *   * Redistributions in binary form must reproduce the above
+ *     copyright notice, this list of conditions and the following
+ *     disclaimer in the documentation and/or other materials provided
+ *     with the distribution.
+ *   * Neither the name of Willow Garage, Inc. nor the names of its
+ *     contributors may be used to endorse or promote products derived
+ *     from this software without specific prior written permission.
+ *
+ *  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+ *  "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+ *  LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
+ *  FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
+ *  COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
+ *  INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
+ *  BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
+ *  LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+ *  CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ *  LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
+ *  ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
+ *  POSSIBILITY OF SUCH DAMAGE.
+ *
+ *  Author: Anatoly Baskeheev, Itseez Ltd, ([email protected])
+ */
+
+#ifndef DEVICE_ARRAY_HPP_
+#define DEVICE_ARRAY_HPP_
+
+#include "device_memory.hpp"
+
+#include <vector>
+//////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
+/** \brief @b DeviceArray class
+  *
+  * \note Typed container for GPU memory with reference counting.
+  *
+  * \author Anatoly Baksheev
+  */
+template<class T>
+class DeviceArray : public DeviceMemory
+{
+    public:
+        /** \brief Element type. */
+        typedef T type;
+
+        /** \brief Element size. */
+        enum { elem_size = sizeof(T) };
+
+        /** \brief Empty constructor. */
+        DeviceArray();
+
+        /** \brief Allocates internal buffer in GPU memory
+          * \param size_t: number of elements to allocate
+          * */
+        DeviceArray(size_t size);
+
+        /** \brief Initializes with user allocated buffer. Reference counting is disabled in this case.
+          * \param ptr: pointer to buffer
+          * \param size: elemens number
+          * */
+        DeviceArray(T *ptr, size_t size);
+
+        /** \brief Copy constructor. Just increments reference counter. */
+        DeviceArray(const DeviceArray& other);
+
+        /** \brief Assigment operator. Just increments reference counter. */
+        DeviceArray& operator = (const DeviceArray& other);
+
+        /** \brief Allocates internal buffer in GPU memory. If internal buffer was created before the function recreates it with new size. If new and old sizes are equal it does nothing.
+          * \param size: elemens number
+          * */
+        void create(size_t size);
+
+        /** \brief Decrements reference counter and releases internal buffer if needed. */
+        void release();
+
+        /** \brief Performs data copying. If destination size differs it will be reallocated.
+          * \param other_arg: destination container
+          * */
+        void copyTo(DeviceArray& other) const;
+
+        /** \brief Uploads data to internal buffer in GPU memory. It calls create() inside to ensure that intenal buffer size is enough.
+          * \param host_ptr_arg: pointer to buffer to upload
+          * \param size: elemens number
+          * */
+        void upload(const T *host_ptr, size_t size);
+
+        /** \brief Downloads data from internal buffer to CPU memory
+          * \param host_ptr_arg: pointer to buffer to download
+          * */
+        void download(T *host_ptr) const;
+
+        /** \brief Uploads data to internal buffer in GPU memory. It calls create() inside to ensure that intenal buffer size is enough.
+          * \param data: host vector to upload from
+          * */
+        template<class A>
+        void upload(const std::vector<T, A>& data);
+
+         /** \brief Downloads data from internal buffer to CPU memory
+           * \param data:  host vector to download to
+           * */
+        template<typename A>
+        void download(std::vector<T, A>& data) const;
+
+        /** \brief Performs swap of data pointed with another device array.
+          * \param other: device array to swap with
+          * */
+        void swap(DeviceArray& other_arg);
+
+        /** \brief Returns pointer for internal buffer in GPU memory. */
+        T* ptr();
+
+        /** \brief Returns const pointer for internal buffer in GPU memory. */
+        const T* ptr() const;
+
+        //using DeviceMemory::ptr;
+
+        /** \brief Returns pointer for internal buffer in GPU memory. */
+        operator T*();
+
+        /** \brief Returns const pointer for internal buffer in GPU memory. */
+        operator const T*() const;
+
+        /** \brief Returns size in elements. */
+        size_t size() const;
+};
+
+
+//////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
+/** \brief @b DeviceArray2D class
+  *
+  * \note Typed container for pitched GPU memory with reference counting.
+  *
+  * \author Anatoly Baksheev
+  */
+template<class T>
+class DeviceArray2D : public DeviceMemory2D
+{
+    public:
+        /** \brief Element type. */
+        typedef T type;
+
+        /** \brief Element size. */
+        enum { elem_size = sizeof(T) };
+
+        /** \brief Empty constructor. */
+        DeviceArray2D();
+
+        /** \brief Allocates internal buffer in GPU memory
+          * \param rows: number of rows to allocate
+          * \param cols: number of elements in each row
+          * */
+        DeviceArray2D(int rows, int cols);
+
+         /** \brief Initializes with user allocated buffer. Reference counting is disabled in this case.
+          * \param rows: number of rows
+          * \param cols: number of elements in each row
+          * \param data: pointer to buffer
+          * \param stepBytes: stride between two consecutive rows in bytes
+          * */
+        DeviceArray2D(int rows, int cols, void *data, size_t stepBytes);
+
+        /** \brief Copy constructor. Just increments reference counter. */
+        DeviceArray2D(const DeviceArray2D& other);
+
+        /** \brief Assigment operator. Just increments reference counter. */
+        DeviceArray2D& operator = (const DeviceArray2D& other);
+
+        /** \brief Allocates internal buffer in GPU memory. If internal buffer was created before the function recreates it with new size. If new and old sizes are equal it does nothing.
+           * \param rows: number of rows to allocate
+           * \param cols: number of elements in each row
+           * */
+        void create(int rows, int cols);
+
+        /** \brief Decrements reference counter and releases internal buffer if needed. */
+        void release();
+
+        /** \brief Performs data copying. If destination size differs it will be reallocated.
+          * \param other: destination container
+          * */
+        void copyTo(DeviceArray2D& other) const;
+
+        /** \brief Uploads data to internal buffer in GPU memory. It calls create() inside to ensure that intenal buffer size is enough.
+          * \param host_ptr: pointer to host buffer to upload
+          * \param host_step: stride between two consecutive rows in bytes for host buffer
+          * \param rows: number of rows to upload
+          * \param cols: number of elements in each row
+          * */
+        void upload(const void *host_ptr, size_t host_step, int rows, int cols);
+
+        /** \brief Downloads data from internal buffer to CPU memory. User is resposible for correct host buffer size.
+          * \param host_ptr: pointer to host buffer to download
+          * \param host_step: stride between two consecutive rows in bytes for host buffer
+          * */
+        void download(void *host_ptr, size_t host_step) const;
+
+        /** \brief Performs swap of data pointed with another device array.
+          * \param other: device array to swap with
+          * */
+        void swap(DeviceArray2D& other_arg);
+
+        /** \brief Uploads data to internal buffer in GPU memory. It calls create() inside to ensure that intenal buffer size is enough.
+          * \param data: host vector to upload from
+          * \param cols: stride in elements between  two consecutive rows in bytes for host buffer
+          * */
+        template<class A>
+        void upload(const std::vector<T, A>& data, int cols);
+
+        /** \brief Downloads data from internal buffer to CPU memory
+           * \param data: host vector to download to
+           * \param cols: Output stride in elements between two consecutive rows in bytes for host vector.
+           * */
+        template<class A>
+        void download(std::vector<T, A>& data, int& cols) const;
+
+        /** \brief Returns pointer to given row in internal buffer.
+          * \param y_arg: row index
+          * */
+        T* ptr(int y = 0);
+
+        /** \brief Returns const pointer to given row in internal buffer.
+          * \param y_arg: row index
+          * */
+        const T* ptr(int y = 0) const;
+
+        //using DeviceMemory2D::ptr;
+
+        /** \brief Returns pointer for internal buffer in GPU memory. */
+        operator T*();
+
+        /** \brief Returns const pointer for internal buffer in GPU memory. */
+        operator const T*() const;
+
+        /** \brief Returns number of elements in each row. */
+        int cols() const;
+
+        /** \brief Returns number of rows. */
+        int rows() const;
+
+        /** \brief Returns step in elements. */
+        size_t elem_step() const;
+};
+
+#include "device_array_impl.hpp"
+
+#endif /* DEVICE_ARRAY_HPP_ */