C++程序  |  254行  |  7.42 KB

/*
 * cl_csc_handler.cpp - CL csc handler
 *
 *  Copyright (c) 2015 Intel Corporation
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 * Author: wangfei <feix.w.wang@intel.com>
 * Author: Wind Yuan <feng.yuan@intel.com>
 */
#include "cl_utils.h"
#include "cl_csc_handler.h"
#include "cl_device.h"
#include "cl_kernel.h"

static const XCamKernelInfo kernel_csc_info[] = {
    {
        "kernel_csc_rgbatonv12",
#include "kernel_csc.clx"
        , 0,
    },
    {
        "kernel_csc_rgbatolab",
#include "kernel_csc.clx"
        , 0,
    },
    {
        "kernel_csc_rgba64torgba",
#include "kernel_csc.clx"
        , 0,
    },
    {
        "kernel_csc_yuyvtorgba",
#include "kernel_csc.clx"
        , 0,
    },
    {
        "kernel_csc_nv12torgba",
#include "kernel_csc.clx"
        , 0,
    },
};


float default_rgbtoyuv_matrix[XCAM_COLOR_MATRIX_SIZE] = {
    0.299f, 0.587f, 0.114f,
    -0.14713f, -0.28886f, 0.436f,
    0.615f, -0.51499f, -0.10001f
};

namespace XCam {

CLCscImageKernel::CLCscImageKernel (const SmartPtr<CLContext> &context, CLCscType type)
    : CLImageKernel (context)
    , _kernel_csc_type (type)
{
}

CLCscImageHandler::CLCscImageHandler (
    const SmartPtr<CLContext> &context, const char *name, CLCscType type)
    : CLImageHandler (context, name)
    , _output_format (V4L2_PIX_FMT_NV12)
    , _csc_type (type)
{
    memcpy (_rgbtoyuv_matrix, default_rgbtoyuv_matrix, sizeof (_rgbtoyuv_matrix));

    switch (type) {
    case CL_CSC_TYPE_RGBATONV12:
        _output_format = V4L2_PIX_FMT_NV12;
        break;
    case CL_CSC_TYPE_RGBATOLAB:
        _output_format = XCAM_PIX_FMT_LAB;
        break;
    case CL_CSC_TYPE_RGBA64TORGBA:
    case CL_CSC_TYPE_YUYVTORGBA:
    case CL_CSC_TYPE_NV12TORGBA:
        _output_format = V4L2_PIX_FMT_RGBA32;
        break;
    default:
        break;
    }
}

bool
CLCscImageHandler::set_csc_kernel (SmartPtr<CLCscImageKernel> &kernel)
{
    SmartPtr<CLImageKernel> image_kernel = kernel;
    add_kernel (image_kernel);
    _csc_kernel = kernel;
    return true;
}

bool
CLCscImageHandler::set_matrix (const XCam3aResultColorMatrix &matrix)
{
    for (int i = 0; i < XCAM_COLOR_MATRIX_SIZE; i++)
        _rgbtoyuv_matrix[i] = (float)matrix.matrix[i];
    return true;
}

bool
CLCscImageHandler::set_output_format (uint32_t fourcc)
{
    XCAM_FAIL_RETURN (
        WARNING,
        V4L2_PIX_FMT_XBGR32 == fourcc || V4L2_PIX_FMT_NV12 == fourcc,
        false,
        "CL csc handler doesn't support format: (%s)",
        xcam_fourcc_to_string (fourcc));

    _output_format = fourcc;
    return true;
}

XCamReturn
CLCscImageHandler::prepare_buffer_pool_video_info (
    const VideoBufferInfo &input,
    VideoBufferInfo &output)
{
    bool format_inited = output.init (_output_format, input.width, input.height);

    XCAM_FAIL_RETURN (
        WARNING,
        format_inited,
        XCAM_RETURN_ERROR_PARAM,
        "CL image handler(%s) output format(%s) unsupported",
        get_name (), xcam_fourcc_to_string (_output_format));

    return XCAM_RETURN_NO_ERROR;
}

static bool
ensure_image_desc (const VideoBufferInfo &info, CLImageDesc &desc)
{
    desc.array_size = 0;
    desc.slice_pitch = 0;
    if (info.format == XCAM_PIX_FMT_RGB48_planar || info.format == XCAM_PIX_FMT_RGB24_planar)
        desc.height = info.aligned_height * 3;

    return true;
}

XCamReturn
CLCscImageHandler::prepare_parameters (SmartPtr<VideoBuffer> &input, SmartPtr<VideoBuffer> &output)
{
    SmartPtr<CLContext> context = get_context ();

    const VideoBufferInfo &in_video_info = input->get_video_info ();
    const VideoBufferInfo &out_video_info = output->get_video_info ();
    CLArgList args;
    CLWorkSize work_size;
    XCamReturn ret = XCAM_RETURN_NO_ERROR;

    XCAM_ASSERT (_csc_kernel.ptr ());

    CLImageDesc in_desc, out_desc;
    CLImage::video_info_2_cl_image_desc (in_video_info, in_desc);
    CLImage::video_info_2_cl_image_desc (out_video_info, out_desc);
    ensure_image_desc (in_video_info, in_desc);
    ensure_image_desc (out_video_info, out_desc);

    SmartPtr<CLImage> image_in  = convert_to_climage (context, input, in_desc, in_video_info.offsets[0]);
    SmartPtr<CLImage> image_out  = convert_to_climage (context, output, out_desc, out_video_info.offsets[0]);
    SmartPtr<CLBuffer> matrix_buffer = new CLBuffer (
        context, sizeof(float)*XCAM_COLOR_MATRIX_SIZE,
        CL_MEM_READ_WRITE | CL_MEM_USE_HOST_PTR , &_rgbtoyuv_matrix);

    XCAM_FAIL_RETURN (
        WARNING,
        image_in->is_valid () && image_out->is_valid () && matrix_buffer->is_valid(),
        XCAM_RETURN_ERROR_MEM,
        "cl image kernel(%s) in/out memory not available", _csc_kernel->get_kernel_name ());

    work_size.dim = XCAM_DEFAULT_IMAGE_DIM;
    work_size.local[0] = 4;
    work_size.local[1] = 4;

    args.push_back (new CLMemArgument (image_in));
    args.push_back (new CLMemArgument (image_out));

    do {
        if ((_csc_type == CL_CSC_TYPE_RGBATOLAB)
                || (_csc_type == CL_CSC_TYPE_RGBA64TORGBA)
                || (_csc_type == CL_CSC_TYPE_YUYVTORGBA)) {
            work_size.global[0] = out_video_info.width;
            work_size.global[1] = out_video_info.height;
            break;
        }

        SmartPtr<CLImage> image_uv;
        if(_csc_type == CL_CSC_TYPE_NV12TORGBA) {
            in_desc.height /= 2;
            image_uv = convert_to_climage (context, input, in_desc, in_video_info.offsets[1]);
            args.push_back (new CLMemArgument (image_uv));

            work_size.global[0] = out_video_info.width / 2;
            work_size.global[1] = out_video_info.height / 2;
            break;
        }

        if (_csc_type == CL_CSC_TYPE_RGBATONV12) {
            out_desc.height /= 2;
            image_uv = convert_to_climage (context, output, out_desc, out_video_info.offsets[1]);
            args.push_back (new CLMemArgument (image_uv));
            args.push_back (new CLMemArgument (matrix_buffer));

            work_size.global[0] = out_video_info.width / 2;
            work_size.global[1] = out_video_info.height / 2;
            break;
        }
    } while (0);

    XCAM_ASSERT (_csc_kernel.ptr ());
    ret = _csc_kernel->set_arguments (args, work_size);
    XCAM_FAIL_RETURN (
        WARNING, ret == XCAM_RETURN_NO_ERROR, ret,
        "csc kernel set arguments failed.");

    return XCAM_RETURN_NO_ERROR;
}

SmartPtr<CLImageHandler>
create_cl_csc_image_handler (const SmartPtr<CLContext> &context, CLCscType type)
{
    SmartPtr<CLCscImageHandler> csc_handler;
    SmartPtr<CLCscImageKernel> csc_kernel;

    XCAM_ASSERT (type < CL_CSC_TYPE_MAX);
    csc_kernel = new CLCscImageKernel (context, type);
    XCAM_ASSERT (csc_kernel.ptr ());
    XCAM_FAIL_RETURN (
        ERROR, csc_kernel->build_kernel (kernel_csc_info[type], NULL) == XCAM_RETURN_NO_ERROR, NULL,
        "build csc kernel(%s) failed", kernel_csc_info[type].kernel_name);

    XCAM_ASSERT (csc_kernel->is_valid ());

    csc_handler = new CLCscImageHandler (context, "cl_handler_csc", type);
    csc_handler->set_csc_kernel (csc_kernel);

    return csc_handler;
}

};