/* * test-image-stitching.cpp - test image stitching * * Copyright (c) 2016 Intel Corporation * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. * * Author: Yinhang Liu <yinhangx.liu@intel.com> * Author: Wind Yuan <feng.yuan@intel.com> */ #include "test_common.h" #include "test_inline.h" #include <unistd.h> #include <getopt.h> #include <image_file_handle.h> #include <calibration_parser.h> #include <ocl/cl_device.h> #include <ocl/cl_context.h> #include <ocl/cl_fisheye_handler.h> #include <ocl/cl_image_360_stitch.h> #include <ocl/cl_utils.h> #if HAVE_OPENCV #include <ocl/cv_base_class.h> #endif #define XCAM_TEST_STITCH_DEBUG 0 #define XCAM_ALIGNED_WIDTH 16 #define CHECK_ACCESS(fliename) \ if (access (fliename, F_OK) != 0) { \ XCAM_LOG_ERROR ("%s not found", fliename); \ return false; \ } using namespace XCam; #if XCAM_TEST_STITCH_DEBUG static void dbg_write_image ( SmartPtr<CLContext> context, SmartPtr<CLImage360Stitch> image_360, SmartPtr<VideoBuffer> input_bufs[], SmartPtr<VideoBuffer> output_buf, SmartPtr<VideoBuffer> top_view_buf, SmartPtr<VideoBuffer> rectified_view_buf, bool all_in_one, int fisheye_num, int input_count); #endif static bool parse_calibration_params ( IntrinsicParameter intrinsic_param[], ExtrinsicParameter extrinsic_param[], int fisheye_num) { CalibrationParser calib_parser; char intrinsic_path[1024], extrinsic_path[1024]; for(int index = 0; index < fisheye_num; index++) { switch (index) { case 0: strncpy (intrinsic_path, "./calib_params/intrinsic_camera_front.txt", 1023); strncpy (extrinsic_path, "./calib_params/extrinsic_camera_front.txt", 1023); break; case 1: strncpy (intrinsic_path, "./calib_params/intrinsic_camera_right.txt", 1023); strncpy (extrinsic_path, "./calib_params/extrinsic_camera_right.txt", 1023); break; case 2: strncpy (intrinsic_path, "./calib_params/intrinsic_camera_rear.txt", 1023); strncpy (extrinsic_path, "./calib_params/extrinsic_camera_rear.txt", 1023); break; case 3: strncpy (intrinsic_path, "./calib_params/intrinsic_camera_left.txt", 1023); strncpy (extrinsic_path, "./calib_params/extrinsic_camera_left.txt", 1023); break; default: XCAM_LOG_ERROR ("bowl view only support 4-camera mode"); return false; } CHECK_ACCESS (intrinsic_path); CHECK_ACCESS (extrinsic_path); if (!xcam_ret_is_ok ( calib_parser.parse_intrinsic_file (intrinsic_path, intrinsic_param[index]))) { XCAM_LOG_ERROR ("parse fisheye:%d intrinsic file:%s failed.", index, intrinsic_path); return false; } if (!xcam_ret_is_ok ( calib_parser.parse_extrinsic_file (extrinsic_path, extrinsic_param[index]))) { XCAM_LOG_ERROR ("parse fisheye:%d extrinsic file:%s failed.", index, extrinsic_path); return false; } extrinsic_param[index].trans_x += TEST_CAMERA_POSITION_OFFSET_X; } return true; } XCamReturn read_file_to_video_buffer ( ImageFileHandle &file, uint32_t width, uint32_t height, uint32_t row_pitch, SmartPtr<VideoBuffer> &buf) { size_t size = row_pitch * height / 2 * 3; uint8_t *nv12_mem = (uint8_t *) xcam_malloc0 (sizeof (uint8_t) * size); XCAM_ASSERT (nv12_mem); XCamReturn ret = file.read_file (nv12_mem, size); if (ret != XCAM_RETURN_NO_ERROR) { xcam_free (nv12_mem); return ret; } uint32_t offset_uv = row_pitch * height; convert_nv12_mem_to_video_buffer (nv12_mem, width, height, row_pitch, offset_uv, buf); XCAM_ASSERT (buf.ptr ()); xcam_free (nv12_mem); return XCAM_RETURN_NO_ERROR; } void usage(const char* arg0) { printf ("Usage:\n" "%s --input file --output file\n" "\t--input input image(NV12)\n" "\t--output output image(NV12)\n" "\t--input-w optional, input width, default: 1920\n" "\t--input-h optional, input height, default: 1080\n" "\t--output-w optional, output width, default: 1920\n" "\t--output-h optional, output width, default: 960\n" "\t--res-mode optional, image resolution mode, select from [1080p/1080p4/4k], default: 1080p\n" "\t--surround-mode optional, stitching surround mode, select from [sphere, bowl], default: sphere\n" "\t--scale-mode optional, image scaling mode, select from [local/global], default: local\n" "\t--enable-seam optional, enable seam finder in blending area, default: no\n" "\t--enable-fisheyemap optional, enable fisheye map, default: no\n" "\t--enable-lsc optional, enable lens shading correction, default: no\n" #if HAVE_OPENCV "\t--fm-ocl optional, enable ocl for feature match, select from [true/false], default: false\n" #endif "\t--fisheye-num optional, the number of fisheye lens, default: 2\n" "\t--all-in-one optional, all fisheye in one image, select from [true/false], default: true\n" "\t--save optional, save file or not, select from [true/false], default: true\n" "\t--framerate optional, framerate of saved video, default: 30.0\n" "\t--loop optional, how many loops need to run for performance test, default: 1\n" "\t--help usage\n", arg0); } int main (int argc, char *argv[]) { XCamReturn ret = XCAM_RETURN_NO_ERROR; SmartPtr<CLContext> context; SmartPtr<BufferPool> buf_pool[XCAM_STITCH_FISHEYE_MAX_NUM]; ImageFileHandle file_in[XCAM_STITCH_FISHEYE_MAX_NUM]; ImageFileHandle file_out; SmartPtr<VideoBuffer> input_buf, output_buf, top_view_buf, rectified_view_buf; VideoBufferInfo input_buf_info, output_buf_info, top_view_buf_info, rectified_view_buf_info; SmartPtr<CLImage360Stitch> image_360; uint32_t input_format = V4L2_PIX_FMT_NV12; uint32_t input_width = 1920; uint32_t input_height = 1080; uint32_t output_height = 960; uint32_t output_width = output_height * 2; uint32_t top_view_width = 1920; uint32_t top_view_height = 1080; uint32_t rectified_view_width = 1920; uint32_t rectified_view_height = 1080; int loop = 1; bool enable_seam = false; bool enable_fisheye_map = false; bool enable_lsc = false; CLBlenderScaleMode scale_mode = CLBlenderScaleLocal; StitchResMode res_mode = StitchRes1080P; SurroundMode surround_mode = BowlView; IntrinsicParameter intrinsic_param[XCAM_STITCH_FISHEYE_MAX_NUM]; ExtrinsicParameter extrinsic_param[XCAM_STITCH_FISHEYE_MAX_NUM]; #if HAVE_OPENCV bool fm_ocl = false; #endif int fisheye_num = 2; bool all_in_one = true; bool need_save_output = true; double framerate = 30.0; const char *file_in_name[XCAM_STITCH_FISHEYE_MAX_NUM] = {NULL}; const char *file_out_name = NULL; const char *top_view_filename = "top_view.mp4"; const char *rectified_view_filename = "rectified_view.mp4"; int input_count = 0; const struct option long_opts[] = { {"input", required_argument, NULL, 'i'}, {"output", required_argument, NULL, 'o'}, {"input-w", required_argument, NULL, 'w'}, {"input-h", required_argument, NULL, 'h'}, {"output-w", required_argument, NULL, 'W'}, {"output-h", required_argument, NULL, 'H'}, {"res-mode", required_argument, NULL, 'R'}, {"surround-mode", required_argument, NULL, 'r'}, {"scale-mode", required_argument, NULL, 'c'}, {"enable-seam", no_argument, NULL, 'S'}, {"enable-fisheyemap", no_argument, NULL, 'F'}, {"enable-lsc", no_argument, NULL, 'L'}, #if HAVE_OPENCV {"fm-ocl", required_argument, NULL, 'O'}, #endif {"fisheye-num", required_argument, NULL, 'N'}, {"all-in-one", required_argument, NULL, 'A'}, {"save", required_argument, NULL, 's'}, {"framerate", required_argument, NULL, 'f'}, {"loop", required_argument, NULL, 'l'}, {"help", no_argument, NULL, 'e'}, {NULL, 0, NULL, 0}, }; int opt = -1; while ((opt = getopt_long(argc, argv, "", long_opts, NULL)) != -1) { switch (opt) { case 'i': XCAM_ASSERT (optarg); file_in_name[input_count] = optarg; input_count++; break; case 'o': XCAM_ASSERT (optarg); file_out_name = optarg; break; case 'w': input_width = atoi(optarg); break; case 'h': input_height = atoi(optarg); break; case 'W': output_width = atoi(optarg); break; case 'H': output_height = atoi(optarg); break; case 'R': if (!strcasecmp (optarg, "1080p")) res_mode = StitchRes1080P; else if (!strcasecmp (optarg, "1080p4")) res_mode = StitchRes1080P4; else if (!strcasecmp (optarg, "4k")) res_mode = StitchRes4K; else { XCAM_LOG_ERROR ("incorrect resolution mode"); return -1; } break; case 'r': if (!strcasecmp (optarg, "sphere")) surround_mode = SphereView; else if(!strcasecmp (optarg, "bowl")) surround_mode = BowlView; else { XCAM_LOG_ERROR ("incorrect surround mode"); return -1; } break; case 'c': if (!strcasecmp (optarg, "local")) scale_mode = CLBlenderScaleLocal; else if (!strcasecmp (optarg, "global")) scale_mode = CLBlenderScaleGlobal; else { XCAM_LOG_ERROR ("incorrect scaling mode"); return -1; } break; case 'S': enable_seam = true; break; case 'F': enable_fisheye_map = true; break; case 'L': enable_lsc = true; break; #if HAVE_OPENCV case 'O': fm_ocl = (strcasecmp (optarg, "true") == 0 ? true : false); break; #endif case 'N': fisheye_num = atoi(optarg); if (fisheye_num > XCAM_STITCH_FISHEYE_MAX_NUM) { XCAM_LOG_ERROR ("fisheye number should not be greater than %d\n", XCAM_STITCH_FISHEYE_MAX_NUM); return -1; } break; case 'A': all_in_one = (strcasecmp (optarg, "false") == 0 ? false : true); break; case 's': need_save_output = (strcasecmp (optarg, "false") == 0 ? false : true); break; case 'f': framerate = atof(optarg); break; case 'l': loop = atoi(optarg); break; case 'e': usage (argv[0]); return -1; default: XCAM_LOG_ERROR ("getopt_long return unknown value:%c", opt); usage (argv[0]); return -1; } } if (optind < argc || argc < 2) { XCAM_LOG_ERROR ("unknown option %s", argv[optind]); usage (argv[0]); return -1; } if (!all_in_one && input_count != fisheye_num) { XCAM_LOG_ERROR ("multiple-input mode: conflicting input number(%d) and fisheye number(%d)", input_count, fisheye_num); return -1; } for (int i = 0; i < input_count; i++) { if (!file_in_name[i]) { XCAM_LOG_ERROR ("input[%d] path is NULL", i); return -1; } } if (!file_out_name) { XCAM_LOG_ERROR ("output path is NULL"); return -1; } output_width = XCAM_ALIGN_UP (output_width, XCAM_ALIGNED_WIDTH); output_height = XCAM_ALIGN_UP (output_height, XCAM_ALIGNED_WIDTH); // if (output_width != output_height * 2) { // XCAM_LOG_ERROR ("incorrect output size width:%d height:%d", output_width, output_height); // return -1; // } #if !HAVE_OPENCV if (need_save_output) { XCAM_LOG_WARNING ("non-OpenCV mode, can't save video"); need_save_output = false; } #endif printf ("Description------------------------\n"); if (all_in_one) printf ("input file:\t\t%s\n", file_in_name[0]); else { for (int i = 0; i < input_count; i++) printf ("input file %d:\t\t%s\n", i, file_in_name[i]); } printf ("output file:\t\t%s\n", file_out_name); printf ("input width:\t\t%d\n", input_width); printf ("input height:\t\t%d\n", input_height); printf ("output width:\t\t%d\n", output_width); printf ("output height:\t\t%d\n", output_height); printf ("resolution mode:\t%s\n", res_mode == StitchRes1080P ? "1080P" : (res_mode == StitchRes1080P4 ? "1080P4" : "4K")); printf ("surround mode: \t\t%s\n", surround_mode == SphereView ? "sphere view" : "bowl view"); printf ("scale mode:\t\t%s\n", scale_mode == CLBlenderScaleLocal ? "local" : "global"); printf ("seam mask:\t\t%s\n", enable_seam ? "true" : "false"); printf ("fisheye map:\t\t%s\n", enable_fisheye_map ? "true" : "false"); printf ("shading correction:\t%s\n", enable_lsc ? "true" : "false"); #if HAVE_OPENCV printf ("feature match ocl:\t%s\n", fm_ocl ? "true" : "false"); #endif printf ("fisheye number:\t\t%d\n", fisheye_num); printf ("all in one:\t\t%s\n", all_in_one ? "true" : "false"); printf ("save file:\t\t%s\n", need_save_output ? "true" : "false"); printf ("framerate:\t\t%.3lf\n", framerate); printf ("loop count:\t\t%d\n", loop); printf ("-----------------------------------\n"); context = CLDevice::instance ()->get_context (); image_360 = create_image_360_stitch ( context, enable_seam, scale_mode, enable_fisheye_map, enable_lsc, surround_mode, res_mode, fisheye_num, all_in_one).dynamic_cast_ptr<CLImage360Stitch> (); XCAM_ASSERT (image_360.ptr ()); image_360->set_output_size (output_width, output_height); #if HAVE_OPENCV image_360->set_feature_match_ocl (fm_ocl); #endif image_360->set_pool_type (CLImageHandler::CLVideoPoolType); if (surround_mode == BowlView) { parse_calibration_params (intrinsic_param, extrinsic_param, fisheye_num); for (int i = 0; i < fisheye_num; i++) { image_360->set_fisheye_intrinsic (intrinsic_param[i], i); image_360->set_fisheye_extrinsic (extrinsic_param[i], i); } } input_buf_info.init (input_format, input_width, input_height); output_buf_info.init (input_format, output_width, output_height); top_view_buf_info.init (input_format, top_view_width, top_view_height); rectified_view_buf_info.init (input_format, rectified_view_width, rectified_view_height); for (int i = 0; i < input_count; i++) { buf_pool[i] = new CLVideoBufferPool (); XCAM_ASSERT (buf_pool[i].ptr ()); buf_pool[i]->set_video_info (input_buf_info); if (!buf_pool[i]->reserve (6)) { XCAM_LOG_ERROR ("init buffer pool failed"); return -1; } } SmartPtr<BufferPool> top_view_pool = new CLVideoBufferPool (); XCAM_ASSERT (top_view_pool.ptr ()); top_view_pool->set_video_info (top_view_buf_info); if (!top_view_pool->reserve (6)) { XCAM_LOG_ERROR ("top-view-buffer pool reserve failed"); return -1; } top_view_buf = top_view_pool->get_buffer (top_view_pool); SmartPtr<BufferPool> rectified_view_pool = new CLVideoBufferPool (); XCAM_ASSERT (rectified_view_pool.ptr ()); rectified_view_pool->set_video_info (rectified_view_buf_info); if (!rectified_view_pool->reserve (6)) { XCAM_LOG_ERROR ("top-view-buffer pool reserve failed"); return -1; } rectified_view_buf = rectified_view_pool->get_buffer (rectified_view_pool); for (int i = 0; i < input_count; i++) { ret = file_in[i].open (file_in_name[i], "rb"); CHECK (ret, "open %s failed", file_in_name[i]); } #if HAVE_OPENCV cv::VideoWriter writer; cv::VideoWriter top_view_writer; cv::VideoWriter rectified_view_writer; if (need_save_output) { cv::Size dst_size = cv::Size (output_width, output_height); if (!writer.open (file_out_name, CV_FOURCC('X', '2', '6', '4'), framerate, dst_size)) { XCAM_LOG_ERROR ("open file %s failed", file_out_name); return -1; } dst_size = cv::Size (top_view_width, top_view_height); if (!top_view_writer.open (top_view_filename, CV_FOURCC('X', '2', '6', '4'), framerate, dst_size)) { XCAM_LOG_ERROR ("open file %s failed", top_view_filename); return -1; } dst_size = cv::Size (rectified_view_width, rectified_view_height); if (!rectified_view_writer.open (rectified_view_filename, CV_FOURCC('X', '2', '6', '4'), framerate, dst_size)) { XCAM_LOG_ERROR ("open file %s failed", rectified_view_filename); return -1; } } #endif SmartPtr<VideoBuffer> pre_buf, cur_buf; #if (HAVE_OPENCV) && (XCAM_TEST_STITCH_DEBUG) SmartPtr<VideoBuffer> input_bufs[XCAM_STITCH_FISHEYE_MAX_NUM]; #endif int frame_id = 0; std::vector<PointFloat2> top_view_map_table; std::vector<PointFloat2> rectified_view_map_table; float rectified_start_angle = -45.0f, rectified_end_angle = 45.0f; while (loop--) { for (int i = 0; i < input_count; i++) { ret = file_in[i].rewind (); CHECK (ret, "image_360 stitch rewind file(%s) failed", file_in_name[i]); } do { for (int i = 0; i < input_count; i++) { cur_buf = buf_pool[i]->get_buffer (buf_pool[i]); XCAM_ASSERT (cur_buf.ptr ()); ret = file_in[i].read_buf (cur_buf); // ret = read_file_to_video_buffer (file_in[i], input_width, input_height, input_width, cur_buf); if (ret == XCAM_RETURN_BYPASS) break; if (ret == XCAM_RETURN_ERROR_FILE) { XCAM_LOG_ERROR ("read buffer from %s failed", file_in_name[i]); return -1; } if (i == 0) input_buf = cur_buf; else pre_buf->attach_buffer (cur_buf); pre_buf = cur_buf; #if (HAVE_OPENCV) && (XCAM_TEST_STITCH_DEBUG) input_bufs[i] = cur_buf; #endif } if (ret == XCAM_RETURN_BYPASS) break; ret = image_360->execute (input_buf, output_buf); CHECK (ret, "image_360 stitch execute failed"); #if HAVE_OPENCV if (need_save_output) { cv::Mat out_mat; convert_to_mat (output_buf, out_mat); writer.write (out_mat); BowlDataConfig config = image_360->get_fisheye_bowl_config (); cv::Mat top_view_mat; sample_generate_top_view (output_buf, top_view_buf, config, top_view_map_table); convert_to_mat (top_view_buf, top_view_mat); top_view_writer.write (top_view_mat); cv::Mat rectified_view_mat; sample_generate_rectified_view (output_buf, rectified_view_buf, config, rectified_start_angle, rectified_end_angle, rectified_view_map_table); convert_to_mat (rectified_view_buf, rectified_view_mat); rectified_view_writer.write (rectified_view_mat); #if XCAM_TEST_STITCH_DEBUG dbg_write_image (context, image_360, input_bufs, output_buf, top_view_buf, rectified_view_buf, all_in_one, fisheye_num, input_count); #endif } else #endif ensure_gpu_buffer_done (output_buf); frame_id++; FPS_CALCULATION (image_stitching, XCAM_OBJ_DUR_FRAME_NUM); } while (true); } return 0; } #if (HAVE_OPENCV) && (XCAM_TEST_STITCH_DEBUG) static void dbg_write_image ( SmartPtr<CLContext> context, SmartPtr<CLImage360Stitch> image_360, SmartPtr<VideoBuffer> input_bufs[], SmartPtr<VideoBuffer> output_buf, SmartPtr<VideoBuffer> top_view_buf, SmartPtr<VideoBuffer> rectified_view_buf, bool all_in_one, int fisheye_num, int input_count) { cv::Mat mat; static int frame_count = 0; char file_name [1024]; StitchInfo stitch_info = image_360->get_stitch_info (); std::snprintf (file_name, 1023, "orig_fisheye_%d.jpg", frame_count); for (int i = 0; i < input_count; i++) { if (!all_in_one) std::snprintf (file_name, 1023, "orig_fisheye_%d_%d.jpg", frame_count, i); convert_to_mat (input_bufs[i], mat); int fisheye_per_frame = all_in_one ? fisheye_num : 1; for (int i = 0; i < fisheye_per_frame; i++) { cv::circle (mat, cv::Point(stitch_info.fisheye_info[i].center_x, stitch_info.fisheye_info[i].center_y), stitch_info.fisheye_info[i].radius, cv::Scalar(0, 0, 255), 2); } cv::imwrite (file_name, mat); } char frame_str[1024]; std::snprintf (frame_str, 1023, "%d", frame_count); convert_to_mat (output_buf, mat); cv::putText (mat, frame_str, cv::Point(120, 120), cv::FONT_HERSHEY_COMPLEX, 2.0, cv::Scalar(0, 0, 255), 2, 8, false); std::snprintf (file_name, 1023, "stitched_img_%d.jpg", frame_count); cv::imwrite (file_name, mat); convert_to_mat (top_view_buf, mat); cv::putText (mat, frame_str, cv::Point(120, 120), cv::FONT_HERSHEY_COMPLEX, 2.0, cv::Scalar(0, 0, 255), 2, 8, false); std::snprintf (file_name, 1023, "top_view_img_%d.jpg", frame_count); cv::imwrite (file_name, mat); convert_to_mat (rectified_view_buf, mat); cv::putText (mat, frame_str, cv::Point(120, 120), cv::FONT_HERSHEY_COMPLEX, 2.0, cv::Scalar(0, 0, 255), 2, 8, false); std::snprintf (file_name, 1023, "rectified_view_img_%d.jpg", frame_count); cv::imwrite (file_name, mat); frame_count++; } #endif