// blob: ddd765f56568e27f91a210568fe437c473af206b [file] [log] [blame]
/*
* test-image-stitching.cpp - test image stitching
*
* Copyright (c) 2016 Intel Corporation
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* Author: Yinhang Liu <[email protected]>
* Author: Wind Yuan <[email protected]>
*/
#include "test_common.h"
#include "test_inline.h"
#include <unistd.h>
#include <getopt.h>
#include <image_file_handle.h>
#include <calibration_parser.h>
#include <ocl/cl_device.h>
#include <ocl/cl_context.h>
#include <ocl/cl_fisheye_handler.h>
#include <ocl/cl_image_360_stitch.h>
#include <ocl/cl_utils.h>
#if HAVE_OPENCV
#include <ocl/cv_base_class.h>
#endif
// Set to 1 to dump per-frame debug JPEG images through dbg_write_image ().
#define XCAM_TEST_STITCH_DEBUG 0
// Alignment applied to the requested output width and height in main ().
#define XCAM_ALIGNED_WIDTH 16

/*
 * CHECK_ACCESS (filename)
 *
 * Logs an error and makes the ENCLOSING function `return false` when
 * `filename` does not exist (access () with F_OK fails). Only usable inside
 * functions returning bool.
 *
 * The body is wrapped in do { } while (0) so the macro behaves like a single
 * statement and stays safe inside unbraced if / else constructs.
 * Note: `filename` is evaluated twice when the file is missing.
 */
#define CHECK_ACCESS(filename) \
    do { \
        if (access ((filename), F_OK) != 0) { \
            XCAM_LOG_ERROR ("%s not found", (filename)); \
            return false; \
        } \
    } while (0)
using namespace XCam;

// Forward declaration of the debug image dumper used by main ().
// The guard matches the one around its definition at the end of this file
// (the dumper needs OpenCV), so a debug build without OpenCV does not end up
// with a static function that is declared but never defined.
#if (HAVE_OPENCV) && (XCAM_TEST_STITCH_DEBUG)
static void dbg_write_image (
    SmartPtr<CLContext> context, SmartPtr<CLImage360Stitch> image_360,
    SmartPtr<VideoBuffer> input_bufs[], SmartPtr<VideoBuffer> output_buf,
    SmartPtr<VideoBuffer> top_view_buf, SmartPtr<VideoBuffer> rectified_view_buf,
    bool all_in_one, int fisheye_num, int input_count);
#endif
/*
 * Load the calibration files of the first `fisheye_num` cameras.
 *
 * Camera index 0..3 maps to the front, right, rear and left camera files
 * under ./calib_params/. For every camera the intrinsic and extrinsic files
 * must both exist and parse successfully; the results are stored in
 * intrinsic_param[index] / extrinsic_param[index], and the extrinsic trans_x
 * is then shifted by TEST_CAMERA_POSITION_OFFSET_X.
 *
 * Returns true when all requested cameras were loaded, false (after logging)
 * on a missing file, a parse failure, or when more than 4 cameras are asked.
 */
static bool
parse_calibration_params (
    IntrinsicParameter intrinsic_param[],
    ExtrinsicParameter extrinsic_param[],
    int fisheye_num)
{
    // Calibration files, indexed by camera position.
    static const char *const intrinsic_files[] = {
        "./calib_params/intrinsic_camera_front.txt",
        "./calib_params/intrinsic_camera_right.txt",
        "./calib_params/intrinsic_camera_rear.txt",
        "./calib_params/intrinsic_camera_left.txt",
    };
    static const char *const extrinsic_files[] = {
        "./calib_params/extrinsic_camera_front.txt",
        "./calib_params/extrinsic_camera_right.txt",
        "./calib_params/extrinsic_camera_rear.txt",
        "./calib_params/extrinsic_camera_left.txt",
    };
    const int supported_cameras = 4;

    CalibrationParser parser;
    char intrinsic_file[1024], extrinsic_file[1024];

    for (int cam = 0; cam < fisheye_num; ++cam) {
        // Cameras already handled stay loaded; the first unsupported index aborts.
        if (cam >= supported_cameras) {
            XCAM_LOG_ERROR ("bowl view only support 4-camera mode");
            return false;
        }

        strncpy (intrinsic_file, intrinsic_files[cam], 1023);
        strncpy (extrinsic_file, extrinsic_files[cam], 1023);

        // Both files must be present before either one is parsed.
        CHECK_ACCESS (intrinsic_file);
        CHECK_ACCESS (extrinsic_file);

        const bool intrinsic_ok =
            xcam_ret_is_ok (parser.parse_intrinsic_file (intrinsic_file, intrinsic_param[cam]));
        if (!intrinsic_ok) {
            XCAM_LOG_ERROR ("parse fisheye:%d intrinsic file:%s failed.", cam, intrinsic_file);
            return false;
        }

        const bool extrinsic_ok =
            xcam_ret_is_ok (parser.parse_extrinsic_file (extrinsic_file, extrinsic_param[cam]));
        if (!extrinsic_ok) {
            XCAM_LOG_ERROR ("parse fisheye:%d extrinsic file:%s failed.", cam, extrinsic_file);
            return false;
        }

        extrinsic_param[cam].trans_x += TEST_CAMERA_POSITION_OFFSET_X;
    }

    return true;
}
/*
 * Read one raw NV12 frame from `file` and convert it into a video buffer.
 *
 * file      : opened image file to read from
 * width     : frame width passed on to the conversion helper
 * height    : frame height in rows
 * row_pitch : bytes per row in the file; the UV plane is taken to start at
 *             row_pitch * height
 * buf       : receives the converted buffer
 *
 * Returns XCAM_RETURN_NO_ERROR on success, XCAM_RETURN_ERROR_MEM when the
 * staging memory or the output buffer is unavailable, or the status reported
 * by file.read_file () when reading fails.
 */
XCamReturn
read_file_to_video_buffer (
    ImageFileHandle &file,
    uint32_t width,
    uint32_t height,
    uint32_t row_pitch,
    SmartPtr<VideoBuffer> &buf)
{
    // Widen before multiplying so the byte count cannot wrap around in 32 bits.
    const size_t luma_size = static_cast<size_t> (row_pitch) * height;
    const size_t size = luma_size / 2 * 3;

    uint8_t *nv12_mem = (uint8_t *) xcam_malloc0 (sizeof (uint8_t) * size);
    // Checked at run time: an assertion alone may be compiled out.
    if (!nv12_mem) {
        XCAM_LOG_ERROR ("allocate %zu bytes for NV12 frame failed", size);
        return XCAM_RETURN_ERROR_MEM;
    }

    XCamReturn ret = file.read_file (nv12_mem, size);
    if (ret != XCAM_RETURN_NO_ERROR) {
        xcam_free (nv12_mem);
        return ret;
    }

    uint32_t offset_uv = row_pitch * height;
    convert_nv12_mem_to_video_buffer (nv12_mem, width, height, row_pitch, offset_uv, buf);

    // The staging memory is no longer needed, whatever the conversion result.
    xcam_free (nv12_mem);

    if (!buf.ptr ()) {
        XCAM_LOG_ERROR ("convert NV12 memory to video buffer failed");
        return XCAM_RETURN_ERROR_MEM;
    }

    return XCAM_RETURN_NO_ERROR;
}
/*
 * Print the command line help to stdout.
 *
 * arg0 : program name shown in the synopsis line (normally argv[0]).
 *
 * The documented defaults mirror the initial values used in main ().
 */
void usage(const char* arg0)
{
    printf ("Usage:\n"
            "%s --input file --output file\n"
            "\t--input input image(NV12)\n"
            "\t--output output image(NV12)\n"
            "\t--input-w optional, input width, default: 1920\n"
            "\t--input-h optional, input height, default: 1080\n"
            "\t--output-w optional, output width, default: 1920\n"
            "\t--output-h optional, output height, default: 960\n"
            "\t--res-mode optional, image resolution mode, select from [1080p/1080p4/4k], default: 1080p\n"
            "\t--surround-mode optional, stitching surround mode, select from [sphere, bowl], default: bowl\n"
            "\t--scale-mode optional, image scaling mode, select from [local/global], default: local\n"
            "\t--enable-seam optional, enable seam finder in blending area, default: no\n"
            "\t--enable-fisheyemap optional, enable fisheye map, default: no\n"
            "\t--enable-lsc optional, enable lens shading correction, default: no\n"
#if HAVE_OPENCV
            "\t--fm-ocl optional, enable ocl for feature match, select from [true/false], default: false\n"
#endif
            "\t--fisheye-num optional, the number of fisheye lens, default: 2\n"
            "\t--all-in-one optional, all fisheye in one image, select from [true/false], default: true\n"
            "\t--save optional, save file or not, select from [true/false], default: true\n"
            "\t--framerate optional, framerate of saved video, default: 30.0\n"
            "\t--loop optional, how many loops need to run for performance test, default: 1\n"
            "\t--help usage\n",
            arg0);
}
/*
 * Entry point of the image stitching test.
 *
 * Steps:
 *   1. parse and validate the command line options;
 *   2. create the 360 stitcher and, in bowl-view mode, load the camera
 *      calibration files;
 *   3. reserve the input / top-view / rectified-view buffer pools and open
 *      the input files (plus the video writers when saving with OpenCV);
 *   4. for each requested loop, rewind the inputs and stitch frame by frame
 *      until an input reports XCAM_RETURN_BYPASS.
 *
 * Returns 0 on success and -1 on any option, setup or processing error
 * (--help also returns -1 after printing the usage).
 */
int main (int argc, char *argv[])
{
    XCamReturn ret = XCAM_RETURN_NO_ERROR;
    SmartPtr<CLContext> context;
    SmartPtr<BufferPool> buf_pool[XCAM_STITCH_FISHEYE_MAX_NUM];
    ImageFileHandle file_in[XCAM_STITCH_FISHEYE_MAX_NUM];
    ImageFileHandle file_out;
    SmartPtr<VideoBuffer> input_buf, output_buf, top_view_buf, rectified_view_buf;
    VideoBufferInfo input_buf_info, output_buf_info, top_view_buf_info, rectified_view_buf_info;
    SmartPtr<CLImage360Stitch> image_360;

    uint32_t input_format = V4L2_PIX_FMT_NV12;
    uint32_t input_width = 1920;
    uint32_t input_height = 1080;
    uint32_t output_height = 960;
    uint32_t output_width = output_height * 2;
    uint32_t top_view_width = 1920;
    uint32_t top_view_height = 1080;
    uint32_t rectified_view_width = 1920;
    uint32_t rectified_view_height = 1080;

    int loop = 1;
    bool enable_seam = false;
    bool enable_fisheye_map = false;
    bool enable_lsc = false;
    CLBlenderScaleMode scale_mode = CLBlenderScaleLocal;
    StitchResMode res_mode = StitchRes1080P;
    SurroundMode surround_mode = BowlView;

    IntrinsicParameter intrinsic_param[XCAM_STITCH_FISHEYE_MAX_NUM];
    ExtrinsicParameter extrinsic_param[XCAM_STITCH_FISHEYE_MAX_NUM];

#if HAVE_OPENCV
    bool fm_ocl = false;
#endif
    int fisheye_num = 2;
    bool all_in_one = true;
    bool need_save_output = true;
    double framerate = 30.0;

    const char *file_in_name[XCAM_STITCH_FISHEYE_MAX_NUM] = {NULL};
    const char *file_out_name = NULL;
    const char *top_view_filename = "top_view.mp4";
    const char *rectified_view_filename = "rectified_view.mp4";
    int input_count = 0;

    const struct option long_opts[] = {
        {"input", required_argument, NULL, 'i'},
        {"output", required_argument, NULL, 'o'},
        {"input-w", required_argument, NULL, 'w'},
        {"input-h", required_argument, NULL, 'h'},
        {"output-w", required_argument, NULL, 'W'},
        {"output-h", required_argument, NULL, 'H'},
        {"res-mode", required_argument, NULL, 'R'},
        {"surround-mode", required_argument, NULL, 'r'},
        {"scale-mode", required_argument, NULL, 'c'},
        {"enable-seam", no_argument, NULL, 'S'},
        {"enable-fisheyemap", no_argument, NULL, 'F'},
        {"enable-lsc", no_argument, NULL, 'L'},
#if HAVE_OPENCV
        {"fm-ocl", required_argument, NULL, 'O'},
#endif
        {"fisheye-num", required_argument, NULL, 'N'},
        {"all-in-one", required_argument, NULL, 'A'},
        {"save", required_argument, NULL, 's'},
        {"framerate", required_argument, NULL, 'f'},
        {"loop", required_argument, NULL, 'l'},
        {"help", no_argument, NULL, 'e'},
        {NULL, 0, NULL, 0},
    };

    // Only long options are accepted (the short option string is empty).
    int opt = -1;
    while ((opt = getopt_long(argc, argv, "", long_opts, NULL)) != -1) {
        switch (opt) {
        case 'i':
            XCAM_ASSERT (optarg);
            // file_in_name[] has a fixed capacity; refuse extra --input options
            // instead of writing past the end of the array.
            if (input_count >= XCAM_STITCH_FISHEYE_MAX_NUM) {
                XCAM_LOG_ERROR ("input number should not be greater than %d", XCAM_STITCH_FISHEYE_MAX_NUM);
                return -1;
            }
            file_in_name[input_count] = optarg;
            input_count++;
            break;
        case 'o':
            XCAM_ASSERT (optarg);
            file_out_name = optarg;
            break;
        case 'w':
            input_width = atoi(optarg);
            break;
        case 'h':
            input_height = atoi(optarg);
            break;
        case 'W':
            output_width = atoi(optarg);
            break;
        case 'H':
            output_height = atoi(optarg);
            break;
        case 'R':
            if (!strcasecmp (optarg, "1080p"))
                res_mode = StitchRes1080P;
            else if (!strcasecmp (optarg, "1080p4"))
                res_mode = StitchRes1080P4;
            else if (!strcasecmp (optarg, "4k"))
                res_mode = StitchRes4K;
            else {
                XCAM_LOG_ERROR ("incorrect resolution mode");
                return -1;
            }
            break;
        case 'r':
            if (!strcasecmp (optarg, "sphere"))
                surround_mode = SphereView;
            else if(!strcasecmp (optarg, "bowl"))
                surround_mode = BowlView;
            else {
                XCAM_LOG_ERROR ("incorrect surround mode");
                return -1;
            }
            break;
        case 'c':
            if (!strcasecmp (optarg, "local"))
                scale_mode = CLBlenderScaleLocal;
            else if (!strcasecmp (optarg, "global"))
                scale_mode = CLBlenderScaleGlobal;
            else {
                XCAM_LOG_ERROR ("incorrect scaling mode");
                return -1;
            }
            break;
        case 'S':
            enable_seam = true;
            break;
        case 'F':
            enable_fisheye_map = true;
            break;
        case 'L':
            enable_lsc = true;
            break;
#if HAVE_OPENCV
        case 'O':
            fm_ocl = (strcasecmp (optarg, "true") == 0 ? true : false);
            break;
#endif
        case 'N':
            fisheye_num = atoi(optarg);
            // atoi () yields 0 for non-numeric text, so reject non-positive counts too.
            if (fisheye_num < 1) {
                XCAM_LOG_ERROR ("fisheye number should be greater than 0");
                return -1;
            }
            if (fisheye_num > XCAM_STITCH_FISHEYE_MAX_NUM) {
                XCAM_LOG_ERROR ("fisheye number should not be greater than %d\n", XCAM_STITCH_FISHEYE_MAX_NUM);
                return -1;
            }
            break;
        case 'A':
            // Anything other than "false" keeps the all-in-one mode enabled.
            all_in_one = (strcasecmp (optarg, "false") == 0 ? false : true);
            break;
        case 's':
            need_save_output = (strcasecmp (optarg, "false") == 0 ? false : true);
            break;
        case 'f':
            framerate = atof(optarg);
            break;
        case 'l':
            loop = atoi(optarg);
            break;
        case 'e':
            usage (argv[0]);
            return -1;
        default:
            XCAM_LOG_ERROR ("getopt_long return unknown value:%c", opt);
            usage (argv[0]);
            return -1;
        }
    }

    // Without any argument argv[optind] is NULL, so handle that case separately
    // instead of printing it as an "unknown option".
    if (argc < 2) {
        XCAM_LOG_ERROR ("no option specified");
        usage (argv[0]);
        return -1;
    }
    if (optind < argc) {
        XCAM_LOG_ERROR ("unknown option %s", argv[optind]);
        usage (argv[0]);
        return -1;
    }

    // At least one input is required: file_in_name[0] is printed below and the
    // frame loop only terminates when an input file reports its end.
    if (input_count < 1) {
        XCAM_LOG_ERROR ("input path is NULL");
        return -1;
    }

    if (!all_in_one && input_count != fisheye_num) {
        XCAM_LOG_ERROR ("multiple-input mode: conflicting input number(%d) and fisheye number(%d)",
                        input_count, fisheye_num);
        return -1;
    }

    for (int i = 0; i < input_count; i++) {
        if (!file_in_name[i]) {
            XCAM_LOG_ERROR ("input[%d] path is NULL", i);
            return -1;
        }
    }

    if (!file_out_name) {
        XCAM_LOG_ERROR ("output path is NULL");
        return -1;
    }

    output_width = XCAM_ALIGN_UP (output_width, XCAM_ALIGNED_WIDTH);
    output_height = XCAM_ALIGN_UP (output_height, XCAM_ALIGNED_WIDTH);
    // if (output_width != output_height * 2) {
    //     XCAM_LOG_ERROR ("incorrect output size width:%d height:%d", output_width, output_height);
    //     return -1;
    // }

#if !HAVE_OPENCV
    if (need_save_output) {
        XCAM_LOG_WARNING ("non-OpenCV mode, can't save video");
        need_save_output = false;
    }
#endif

    printf ("Description------------------------\n");
    if (all_in_one)
        printf ("input file:\t\t%s\n", file_in_name[0]);
    else {
        for (int i = 0; i < input_count; i++)
            printf ("input file %d:\t\t%s\n", i, file_in_name[i]);
    }
    printf ("output file:\t\t%s\n", file_out_name);
    printf ("input width:\t\t%d\n", input_width);
    printf ("input height:\t\t%d\n", input_height);
    printf ("output width:\t\t%d\n", output_width);
    printf ("output height:\t\t%d\n", output_height);
    printf ("resolution mode:\t%s\n",
            res_mode == StitchRes1080P ? "1080P" : (res_mode == StitchRes1080P4 ? "1080P4" : "4K"));
    printf ("surround mode: \t\t%s\n",
            surround_mode == SphereView ? "sphere view" : "bowl view");
    printf ("scale mode:\t\t%s\n", scale_mode == CLBlenderScaleLocal ? "local" : "global");
    printf ("seam mask:\t\t%s\n", enable_seam ? "true" : "false");
    printf ("fisheye map:\t\t%s\n", enable_fisheye_map ? "true" : "false");
    printf ("shading correction:\t%s\n", enable_lsc ? "true" : "false");
#if HAVE_OPENCV
    printf ("feature match ocl:\t%s\n", fm_ocl ? "true" : "false");
#endif
    printf ("fisheye number:\t\t%d\n", fisheye_num);
    printf ("all in one:\t\t%s\n", all_in_one ? "true" : "false");
    printf ("save file:\t\t%s\n", need_save_output ? "true" : "false");
    printf ("framerate:\t\t%.3lf\n", framerate);
    printf ("loop count:\t\t%d\n", loop);
    printf ("-----------------------------------\n");

    context = CLDevice::instance ()->get_context ();
    image_360 =
        create_image_360_stitch (
            context, enable_seam, scale_mode, enable_fisheye_map, enable_lsc, surround_mode,
            res_mode, fisheye_num, all_in_one).dynamic_cast_ptr<CLImage360Stitch> ();
    XCAM_ASSERT (image_360.ptr ());
    image_360->set_output_size (output_width, output_height);
#if HAVE_OPENCV
    image_360->set_feature_match_ocl (fm_ocl);
#endif
    image_360->set_pool_type (CLImageHandler::CLVideoPoolType);

    if (surround_mode == BowlView) {
        // Do not continue with calibration data that failed to load.
        if (!parse_calibration_params (intrinsic_param, extrinsic_param, fisheye_num)) {
            XCAM_LOG_ERROR ("parse calibration parameters failed");
            return -1;
        }
        for (int i = 0; i < fisheye_num; i++) {
            image_360->set_fisheye_intrinsic (intrinsic_param[i], i);
            image_360->set_fisheye_extrinsic (extrinsic_param[i], i);
        }
    }

    input_buf_info.init (input_format, input_width, input_height);
    output_buf_info.init (input_format, output_width, output_height);
    top_view_buf_info.init (input_format, top_view_width, top_view_height);
    rectified_view_buf_info.init (input_format, rectified_view_width, rectified_view_height);

    // One buffer pool per input file.
    for (int i = 0; i < input_count; i++) {
        buf_pool[i] = new CLVideoBufferPool ();
        XCAM_ASSERT (buf_pool[i].ptr ());
        buf_pool[i]->set_video_info (input_buf_info);
        if (!buf_pool[i]->reserve (6)) {
            XCAM_LOG_ERROR ("init buffer pool failed");
            return -1;
        }
    }

    SmartPtr<BufferPool> top_view_pool = new CLVideoBufferPool ();
    XCAM_ASSERT (top_view_pool.ptr ());
    top_view_pool->set_video_info (top_view_buf_info);
    if (!top_view_pool->reserve (6)) {
        XCAM_LOG_ERROR ("top-view-buffer pool reserve failed");
        return -1;
    }
    top_view_buf = top_view_pool->get_buffer (top_view_pool);

    SmartPtr<BufferPool> rectified_view_pool = new CLVideoBufferPool ();
    XCAM_ASSERT (rectified_view_pool.ptr ());
    rectified_view_pool->set_video_info (rectified_view_buf_info);
    if (!rectified_view_pool->reserve (6)) {
        XCAM_LOG_ERROR ("rectified-view-buffer pool reserve failed");
        return -1;
    }
    rectified_view_buf = rectified_view_pool->get_buffer (rectified_view_pool);

    for (int i = 0; i < input_count; i++) {
        ret = file_in[i].open (file_in_name[i], "rb");
        CHECK (ret, "open %s failed", file_in_name[i]);
    }

#if HAVE_OPENCV
    cv::VideoWriter writer;
    cv::VideoWriter top_view_writer;
    cv::VideoWriter rectified_view_writer;
    if (need_save_output) {
        cv::Size dst_size = cv::Size (output_width, output_height);
        if (!writer.open (file_out_name, CV_FOURCC('X', '2', '6', '4'), framerate, dst_size)) {
            XCAM_LOG_ERROR ("open file %s failed", file_out_name);
            return -1;
        }

        dst_size = cv::Size (top_view_width, top_view_height);
        if (!top_view_writer.open (top_view_filename, CV_FOURCC('X', '2', '6', '4'), framerate, dst_size)) {
            XCAM_LOG_ERROR ("open file %s failed", top_view_filename);
            return -1;
        }

        dst_size = cv::Size (rectified_view_width, rectified_view_height);
        if (!rectified_view_writer.open (rectified_view_filename, CV_FOURCC('X', '2', '6', '4'), framerate, dst_size)) {
            XCAM_LOG_ERROR ("open file %s failed", rectified_view_filename);
            return -1;
        }
    }
#endif

    SmartPtr<VideoBuffer> pre_buf, cur_buf;
#if (HAVE_OPENCV) && (XCAM_TEST_STITCH_DEBUG)
    SmartPtr<VideoBuffer> input_bufs[XCAM_STITCH_FISHEYE_MAX_NUM];
#endif
    int frame_id = 0;
    std::vector<PointFloat2> top_view_map_table;
    std::vector<PointFloat2> rectified_view_map_table;
    float rectified_start_angle = -45.0f, rectified_end_angle = 45.0f;

    while (loop--) {
        // Every pass starts again from the beginning of each input file.
        for (int i = 0; i < input_count; i++) {
            ret = file_in[i].rewind ();
            CHECK (ret, "image_360 stitch rewind file(%s) failed", file_in_name[i]);
        }

        do {
            // Read one frame per input; the first buffer becomes the stitcher
            // input and each following buffer is attached to the previous one.
            for (int i = 0; i < input_count; i++) {
                cur_buf = buf_pool[i]->get_buffer (buf_pool[i]);
                XCAM_ASSERT (cur_buf.ptr ());
                ret = file_in[i].read_buf (cur_buf);
                // ret = read_file_to_video_buffer (file_in[i], input_width, input_height, input_width, cur_buf);
                if (ret == XCAM_RETURN_BYPASS)
                    break;
                if (ret == XCAM_RETURN_ERROR_FILE) {
                    XCAM_LOG_ERROR ("read buffer from %s failed", file_in_name[i]);
                    return -1;
                }

                if (i == 0)
                    input_buf = cur_buf;
                else
                    pre_buf->attach_buffer (cur_buf);
                pre_buf = cur_buf;
#if (HAVE_OPENCV) && (XCAM_TEST_STITCH_DEBUG)
                input_bufs[i] = cur_buf;
#endif
            }
            // XCAM_RETURN_BYPASS from a read is treated as the end of this pass.
            if (ret == XCAM_RETURN_BYPASS)
                break;

            ret = image_360->execute (input_buf, output_buf);
            CHECK (ret, "image_360 stitch execute failed");

#if HAVE_OPENCV
            if (need_save_output) {
                cv::Mat out_mat;
                convert_to_mat (output_buf, out_mat);
                writer.write (out_mat);

                BowlDataConfig config = image_360->get_fisheye_bowl_config ();

                cv::Mat top_view_mat;
                sample_generate_top_view (output_buf, top_view_buf, config, top_view_map_table);
                convert_to_mat (top_view_buf, top_view_mat);
                top_view_writer.write (top_view_mat);

                cv::Mat rectified_view_mat;
                sample_generate_rectified_view (output_buf, rectified_view_buf, config, rectified_start_angle,
                                                rectified_end_angle, rectified_view_map_table);
                convert_to_mat (rectified_view_buf, rectified_view_mat);
                rectified_view_writer.write (rectified_view_mat);

#if XCAM_TEST_STITCH_DEBUG
                dbg_write_image (context, image_360, input_bufs, output_buf, top_view_buf, rectified_view_buf,
                                 all_in_one, fisheye_num, input_count);
#endif
            } else
#endif
                // Runs unconditionally without OpenCV, otherwise only when the
                // output is not saved.
                ensure_gpu_buffer_done (output_buf);

            frame_id++;
            FPS_CALCULATION (image_stitching, XCAM_OBJ_DUR_FRAME_NUM);
        } while (true);
    }

    return 0;
}
#if (HAVE_OPENCV) && (XCAM_TEST_STITCH_DEBUG)
/*
 * Debug helper: dump the buffers of the current frame as JPEG files.
 *
 * Written files (N is a call counter kept in a function-local static):
 *   orig_fisheye_N.jpg          input frame, all-in-one mode
 *   orig_fisheye_N_I.jpg        input frame of input I, multiple-input mode
 *   stitched_img_N.jpg          stitched output
 *   top_view_img_N.jpg          top view
 *   rectified_view_img_N.jpg    rectified view
 *
 * Input frames get a circle per fisheye drawn from the stitcher's
 * fisheye_info (center_x, center_y, radius); the other images get the frame
 * number drawn as text.
 *
 * `context` is not used by this function.
 */
static void dbg_write_image (
    SmartPtr<CLContext> context, SmartPtr<CLImage360Stitch> image_360,
    SmartPtr<VideoBuffer> input_bufs[], SmartPtr<VideoBuffer> output_buf,
    SmartPtr<VideoBuffer> top_view_buf, SmartPtr<VideoBuffer> rectified_view_buf,
    bool all_in_one, int fisheye_num, int input_count)
{
    cv::Mat mat;
    static int frame_count = 0;
    char file_name [1024];
    StitchInfo stitch_info = image_360->get_stitch_info ();

    std::snprintf (file_name, sizeof (file_name), "orig_fisheye_%d.jpg", frame_count);
    for (int input_idx = 0; input_idx < input_count; input_idx++) {
        if (!all_in_one)
            std::snprintf (file_name, sizeof (file_name), "orig_fisheye_%d_%d.jpg", frame_count, input_idx);

        convert_to_mat (input_bufs[input_idx], mat);

        const int fisheye_per_frame = all_in_one ? fisheye_num : 1;
        for (int k = 0; k < fisheye_per_frame; k++) {
            // All-in-one: one frame carries every fisheye. Multiple-input: the
            // frame of input I carries fisheye I, so use that entry rather
            // than always entry 0.
            const int fisheye_idx = all_in_one ? k : input_idx;
            cv::circle (mat,
                        cv::Point(stitch_info.fisheye_info[fisheye_idx].center_x,
                                  stitch_info.fisheye_info[fisheye_idx].center_y),
                        stitch_info.fisheye_info[fisheye_idx].radius, cv::Scalar(0, 0, 255), 2);
        }
        cv::imwrite (file_name, mat);
    }

    char frame_str[1024];
    std::snprintf (frame_str, sizeof (frame_str), "%d", frame_count);

    convert_to_mat (output_buf, mat);
    cv::putText (mat, frame_str, cv::Point(120, 120), cv::FONT_HERSHEY_COMPLEX, 2.0,
                 cv::Scalar(0, 0, 255), 2, 8, false);
    std::snprintf (file_name, sizeof (file_name), "stitched_img_%d.jpg", frame_count);
    cv::imwrite (file_name, mat);

    convert_to_mat (top_view_buf, mat);
    cv::putText (mat, frame_str, cv::Point(120, 120), cv::FONT_HERSHEY_COMPLEX, 2.0,
                 cv::Scalar(0, 0, 255), 2, 8, false);
    std::snprintf (file_name, sizeof (file_name), "top_view_img_%d.jpg", frame_count);
    cv::imwrite (file_name, mat);

    convert_to_mat (rectified_view_buf, mat);
    cv::putText (mat, frame_str, cv::Point(120, 120), cv::FONT_HERSHEY_COMPLEX, 2.0,
                 cv::Scalar(0, 0, 255), 2, 8, false);
    std::snprintf (file_name, sizeof (file_name), "rectified_view_img_%d.jpg", frame_count);
    cv::imwrite (file_name, mat);

    frame_count++;
}
#endif