MyBlender.cpp

//
//
//

//#include <nmmintrin.h>
#include "MyBlender.h"

namespace cv {
namespace detail {


MyBlender::MyBlender(int try_gpu)
{
	use_gpu = false;

	if (try_gpu)
	{
		if (gpu::getCudaEnabledDeviceCount() > 0)
		{
			use_gpu = true;
		}
	}
}

void MyBlender::prepare(Rect dst_roi)
{
	/*
	dst_.create(dst_roi.size(), CV_8UC3);
    dst_.setTo(Scalar::all(0));
	if (use_gpu)
	{
		gpuDst_.upload(dst_);
	}
	*/
    dst_mask_.create(dst_roi.size(), CV_8U);
    dst_mask_.setTo(Scalar::all(0));
    dst_roi_ = dst_roi;
}

void MyBlender::feed(const Mat &img, const Mat &mask, Point tl)
{
	CV_Assert(img.type() == CV_8UC3 || img.type() == CV_16SC3); // 両方受け付ける
    CV_Assert(mask.type() == CV_8U);
 
	// ここで入力に応じてdst_を作成する
	if (dst_.empty()) {
		dst_.create(dst_roi_.size(), img.type());
		dst_.setTo(Scalar::all(0));
//#ifndef JETSON_TK1
		if (use_gpu)
		{
			gpuDst_.upload(dst_);
		}
//#endif
	}

	int dx = tl.x - dst_roi_.x;
    int dy = tl.y - dst_roi_.y;

	if (use_gpu)
	{
//#ifdef JETSON_TK1
//		cv::gpu::device::cudaFeed(img, mask, dst_, dx, dy);
//#else
		cv::gpu::device::cudaFeed(img, mask, gpuDst_, dx, dy);
//#endif
	}
	else if (img.type() == CV_8UC3)
	{
#ifdef	_OPENMP
#		pragma omp parallel for
#endif
		for (int y = 0; y < img.rows; ++y)
		{
			const Point3_<uchar> *src_row = img.ptr<Point3_<uchar> >(y);
			const uchar *mask_row = mask.ptr<uchar>(y);
			Point3_<uchar> *dst_row = dst_.ptr<Point3_<uchar> >(dy + y);
			uchar *dst_mask_row = dst_mask_.ptr<uchar>(dy + y);

			for (int x = 0; x < img.cols; ++x)
			{
				if (mask_row[x])
					dst_row[dx + x] = src_row[x];
				dst_mask_row[dx + x] |= mask_row[x];
			}
		}
	}
	else // CV_16SC3
	{
#ifdef	_OPENMP
#		pragma omp parallel for
#endif
		for (int y = 0; y < img.rows; ++y)
		{
			const Point3_<short> *src_row = img.ptr<Point3_<short> >(y);
			const uchar *mask_row = mask.ptr<uchar>(y);
			Point3_<short> *dst_row = dst_.ptr<Point3_<short> >(dy + y);
			uchar *dst_mask_row = dst_mask_.ptr<uchar>(dy + y);

			for (int x = 0; x < img.cols; ++x)
			{
				if (mask_row[x])
					dst_row[dx + x] = src_row[x];
				dst_mask_row[dx + x] |= mask_row[x];
			}
		}
	}
}

void MyBlender::feed(const gpu::GpuMat &img, const gpu::GpuMat &mask, Point tl)
{
	CV_Assert(img.type() == CV_8UC3);
    CV_Assert(mask.type() == CV_8U);
	// ここで入力に応じてdst_を作成する
	if (dst_.empty()) {
		dst_.create(dst_roi_.size(), img.type());
		dst_.setTo(Scalar::all(0));
		if (use_gpu)
		{
			gpuDst_.upload(dst_);
		}	
	}

    int dx = tl.x - dst_roi_.x;
    int dy = tl.y - dst_roi_.y;

	cv::gpu::device::cudaFeed(img, mask, gpuDst_, dx, dy);
}

void MyBlender::blend(Mat &dst, Mat &dst_mask)
{
	if (use_gpu)
	{
//#ifndef JETSON_TK1
		gpuDst_.download(dst);
		gpuDst_.release();
//#endif
	}
	else 
	{
		dst_.setTo(Scalar::all(0), dst_mask_ == 0);
		dst = dst_;
	}
    dst_mask = dst_mask_;
    dst_.release();
    dst_mask_.release();
}

} // namespace detail
} // namespace cv