/* * cl_wavelet_denoise_handler.cpp - CL wavelet denoise handler * * Copyright (c) 2015 Intel Corporation * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. * * Author: Wei Zong <wei.zong@intel.com> */ #include "cl_utils.h" #include "x3a_stats_pool.h" #include "cl_context.h" #include "cl_device.h" #include "cl_wavelet_denoise_handler.h" #define WAVELET_DECOMPOSITION_LEVELS 4 namespace XCam { static const XCamKernelInfo kernel_wavelet_denoise_info = { "kernel_wavelet_denoise", #include "kernel_wavelet_denoise.clx" , 0, }; CLWaveletDenoiseImageKernel::CLWaveletDenoiseImageKernel ( const SmartPtr<CLContext> &context, const char *name, SmartPtr<CLWaveletDenoiseImageHandler> &handler, uint32_t channel, uint32_t layer) : CLImageKernel (context, name) , _channel (channel) , _current_layer (layer) , _handler (handler) { } XCamReturn CLWaveletDenoiseImageKernel::prepare_arguments ( CLArgList &args, CLWorkSize &work_size) { SmartPtr<CLContext> context = get_context (); SmartPtr<VideoBuffer> input = _handler->get_input_buf (); SmartPtr<VideoBuffer> output = _handler->get_output_buf (); const VideoBufferInfo &video_info_in = input->get_video_info (); const VideoBufferInfo &video_info_out = output->get_video_info (); SmartPtr<CLMemory> input_image = convert_to_clbuffer (context, input); SmartPtr<CLMemory> reconstruct_image = convert_to_clbuffer (context, output); SmartPtr<CLMemory> details_image = _handler->get_details_image (); SmartPtr<CLMemory> approx_image = _handler->get_approx_image (); uint32_t decomposition_levels = WAVELET_DECOMPOSITION_LEVELS; float soft_threshold = _handler->get_denoise_config ().threshold[0]; float hard_threshold = _handler->get_denoise_config ().threshold[1]; uint32_t input_y_offset = video_info_in.offsets[0] / 4; uint32_t output_y_offset = video_info_out.offsets[0] / 4; uint32_t input_uv_offset = video_info_in.aligned_height; uint32_t output_uv_offset = video_info_out.aligned_height; XCAM_FAIL_RETURN ( WARNING, input_image->is_valid () && reconstruct_image->is_valid (), XCAM_RETURN_ERROR_MEM, "cl image kernel(%s) in/out memory not available", XCAM_STR(get_kernel_name ())); //set args; work_size.dim = XCAM_DEFAULT_IMAGE_DIM; work_size.local[0] = 8; work_size.local[1] = 4; if (_current_layer % 2) { args.push_back (new CLMemArgument (input_image)); args.push_back (new CLMemArgument (approx_image)); } else { args.push_back (new CLMemArgument (approx_image)); args.push_back (new CLMemArgument (input_image)); } args.push_back (new CLMemArgument (details_image)); args.push_back (new CLMemArgument (reconstruct_image)); args.push_back (new CLArgumentT<uint32_t> (input_y_offset)); args.push_back (new CLArgumentT<uint32_t> (output_y_offset)); args.push_back (new CLArgumentT<uint32_t> (input_uv_offset)); args.push_back (new CLArgumentT<uint32_t> (output_uv_offset)); args.push_back (new CLArgumentT<uint32_t> (_current_layer)); args.push_back (new CLArgumentT<uint32_t> (decomposition_levels)); args.push_back (new CLArgumentT<float> (hard_threshold)); args.push_back (new CLArgumentT<float> (soft_threshold)); if (_channel & CL_IMAGE_CHANNEL_UV) { work_size.global[0] = video_info_in.width / 16; work_size.global[1] = video_info_in.height / 2; } else { work_size.global[0] = video_info_in.width / 16; work_size.global[1] = video_info_in.height; } return XCAM_RETURN_NO_ERROR; } CLWaveletDenoiseImageHandler::CLWaveletDenoiseImageHandler ( const SmartPtr<CLContext> &context, const char *name) : CLImageHandler (context, name) { _config.decomposition_levels = 5; _config.threshold[0] = 0.5; _config.threshold[1] = 5.0; } XCamReturn CLWaveletDenoiseImageHandler::prepare_output_buf (SmartPtr<VideoBuffer> &input, SmartPtr<VideoBuffer> &output) { XCamReturn ret = XCAM_RETURN_NO_ERROR; CLImageHandler::prepare_output_buf(input, output); if (!_approx_image.ptr ()) { const VideoBufferInfo & video_info = input->get_video_info (); uint32_t buffer_size = video_info.width * video_info.aligned_height; _approx_image = new CLBuffer (get_context (), buffer_size, CL_MEM_READ_WRITE | CL_MEM_ALLOC_HOST_PTR, NULL); } if (!_details_image.ptr ()) { const VideoBufferInfo & video_info = input->get_video_info (); uint32_t buffer_size = sizeof(float) * video_info.width * video_info.height; _details_image = new CLBuffer (get_context (), buffer_size, CL_MEM_READ_WRITE | CL_MEM_ALLOC_HOST_PTR, NULL); } return ret; } bool CLWaveletDenoiseImageHandler::set_denoise_config (const XCam3aResultWaveletNoiseReduction& config) { _config = config; return true; } SmartPtr<CLImageHandler> create_cl_wavelet_denoise_image_handler (const SmartPtr<CLContext> &context, uint32_t channel) { SmartPtr<CLWaveletDenoiseImageHandler> wavelet_handler; SmartPtr<CLWaveletDenoiseImageKernel> wavelet_kernel; wavelet_handler = new CLWaveletDenoiseImageHandler (context, "cl_handler_wavelet_denoise"); XCAM_ASSERT (wavelet_handler.ptr ()); for (int layer = 1; layer <= WAVELET_DECOMPOSITION_LEVELS; layer++) { wavelet_kernel = new CLWaveletDenoiseImageKernel ( context, "kernel_wavelet_denoise", wavelet_handler, channel, layer); const char *build_options = (channel & CL_IMAGE_CHANNEL_UV) ? "-DWAVELET_DENOISE_UV=1" : "-DWAVELET_DENOISE_UV=0"; XCAM_ASSERT (wavelet_kernel.ptr ()); XCAM_FAIL_RETURN ( ERROR, wavelet_kernel->build_kernel (kernel_wavelet_denoise_info, build_options) == XCAM_RETURN_NO_ERROR, NULL, "build wavelet denoise kernel(%s) failed", kernel_wavelet_denoise_info.kernel_name); XCAM_ASSERT (wavelet_kernel->is_valid ()); wavelet_handler->add_kernel (wavelet_kernel); } return wavelet_handler; } };