FFmpeg/libavfilter/dnn/dnn_io_proc.c

/*
 * Copyright (c) 2020
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include "dnn_io_proc.h"
#include "libavutil/imgutils.h"
#include "libswscale/swscale.h"
#include "libavutil/avassert.h"

DNNReturnType ff_proc_from_dnn_to_frame(AVFrame *frame, DNNData *output, void *log_ctx)
{
    struct SwsContext *sws_ctx;
    int bytewidth = av_image_get_linesize(frame->format, frame->width, 0);
    if (output->dt != DNN_FLOAT) {
        avpriv_report_missing_feature(log_ctx, "data type rather than DNN_FLOAT");
        return DNN_ERROR;
    }

    switch (frame->format) {
    case AV_PIX_FMT_RGB24:
    case AV_PIX_FMT_BGR24:
        sws_ctx = sws_getContext(frame->width * 3,
                                 frame->height,
                                 AV_PIX_FMT_GRAYF32,
                                 frame->width * 3,
                                 frame->height,
                                 AV_PIX_FMT_GRAY8,
                                 0, NULL, NULL, NULL);
        if (!sws_ctx) {
            av_log(log_ctx, AV_LOG_ERROR, "Impossible to create scale context for the conversion "
                "fmt:%s s:%dx%d -> fmt:%s s:%dx%d\n",
                av_get_pix_fmt_name(AV_PIX_FMT_GRAYF32), frame->width * 3, frame->height,
                av_get_pix_fmt_name(AV_PIX_FMT_GRAY8),   frame->width * 3, frame->height);
            return DNN_ERROR;
        }
        sws_scale(sws_ctx, (const uint8_t *[4]){(const uint8_t *)output->data, 0, 0, 0},
                           (const int[4]){frame->width * 3 * sizeof(float), 0, 0, 0}, 0, frame->height,
                           (uint8_t * const*)frame->data, frame->linesize);
        sws_freeContext(sws_ctx);
        return DNN_SUCCESS;
    case AV_PIX_FMT_GRAYF32:
        av_image_copy_plane(frame->data[0], frame->linesize[0],
                            output->data, bytewidth,
                            bytewidth, frame->height);
        return DNN_SUCCESS;
    case AV_PIX_FMT_YUV420P:
    case AV_PIX_FMT_YUV422P:
    case AV_PIX_FMT_YUV444P:
    case AV_PIX_FMT_YUV410P:
    case AV_PIX_FMT_YUV411P:
    case AV_PIX_FMT_GRAY8:
    case AV_PIX_FMT_NV12:
        sws_ctx = sws_getContext(frame->width,
                                 frame->height,
                                 AV_PIX_FMT_GRAYF32,
                                 frame->width,
                                 frame->height,
                                 AV_PIX_FMT_GRAY8,
                                 0, NULL, NULL, NULL);
        if (!sws_ctx) {
            av_log(log_ctx, AV_LOG_ERROR, "Impossible to create scale context for the conversion "
                "fmt:%s s:%dx%d -> fmt:%s s:%dx%d\n",
                av_get_pix_fmt_name(AV_PIX_FMT_GRAYF32), frame->width, frame->height,
                av_get_pix_fmt_name(AV_PIX_FMT_GRAY8),   frame->width, frame->height);
            return DNN_ERROR;
        }
        sws_scale(sws_ctx, (const uint8_t *[4]){(const uint8_t *)output->data, 0, 0, 0},
                           (const int[4]){frame->width * sizeof(float), 0, 0, 0}, 0, frame->height,
                           (uint8_t * const*)frame->data, frame->linesize);
        sws_freeContext(sws_ctx);
        return DNN_SUCCESS;
    default:
        avpriv_report_missing_feature(log_ctx, "%s", av_get_pix_fmt_name(frame->format));
        return DNN_ERROR;
    }

    return DNN_SUCCESS;
}

static DNNReturnType proc_from_frame_to_dnn_frameprocessing(AVFrame *frame, DNNData *input, void *log_ctx)
{
    struct SwsContext *sws_ctx;
    int bytewidth = av_image_get_linesize(frame->format, frame->width, 0);
    if (input->dt != DNN_FLOAT) {
        avpriv_report_missing_feature(log_ctx, "data type rather than DNN_FLOAT");
        return DNN_ERROR;
    }

    switch (frame->format) {
    case AV_PIX_FMT_RGB24:
    case AV_PIX_FMT_BGR24:
        sws_ctx = sws_getContext(frame->width * 3,
                                 frame->height,
                                 AV_PIX_FMT_GRAY8,
                                 frame->width * 3,
                                 frame->height,
                                 AV_PIX_FMT_GRAYF32,
                                 0, NULL, NULL, NULL);
        if (!sws_ctx) {
            av_log(log_ctx, AV_LOG_ERROR, "Impossible to create scale context for the conversion "
                "fmt:%s s:%dx%d -> fmt:%s s:%dx%d\n",
                av_get_pix_fmt_name(AV_PIX_FMT_GRAY8),  frame->width * 3, frame->height,
                av_get_pix_fmt_name(AV_PIX_FMT_GRAYF32),frame->width * 3, frame->height);
            return DNN_ERROR;
        }
        sws_scale(sws_ctx, (const uint8_t **)frame->data,
                           frame->linesize, 0, frame->height,
                           (uint8_t * const*)(&input->data),
                           (const int [4]){frame->width * 3 * sizeof(float), 0, 0, 0});
        sws_freeContext(sws_ctx);
        break;
    case AV_PIX_FMT_GRAYF32:
        av_image_copy_plane(input->data, bytewidth,
                            frame->data[0], frame->linesize[0],
                            bytewidth, frame->height);
        break;
    case AV_PIX_FMT_YUV420P:
    case AV_PIX_FMT_YUV422P:
    case AV_PIX_FMT_YUV444P:
    case AV_PIX_FMT_YUV410P:
    case AV_PIX_FMT_YUV411P:
    case AV_PIX_FMT_GRAY8:
    case AV_PIX_FMT_NV12:
        sws_ctx = sws_getContext(frame->width,
                                 frame->height,
                                 AV_PIX_FMT_GRAY8,
                                 frame->width,
                                 frame->height,
                                 AV_PIX_FMT_GRAYF32,
                                 0, NULL, NULL, NULL);
        if (!sws_ctx) {
            av_log(log_ctx, AV_LOG_ERROR, "Impossible to create scale context for the conversion "
                "fmt:%s s:%dx%d -> fmt:%s s:%dx%d\n",
                av_get_pix_fmt_name(AV_PIX_FMT_GRAY8),  frame->width, frame->height,
                av_get_pix_fmt_name(AV_PIX_FMT_GRAYF32),frame->width, frame->height);
            return DNN_ERROR;
        }
        sws_scale(sws_ctx, (const uint8_t **)frame->data,
                           frame->linesize, 0, frame->height,
                           (uint8_t * const*)(&input->data),
                           (const int [4]){frame->width * sizeof(float), 0, 0, 0});
        sws_freeContext(sws_ctx);
        break;
    default:
        avpriv_report_missing_feature(log_ctx, "%s", av_get_pix_fmt_name(frame->format));
        return DNN_ERROR;
    }

    return DNN_SUCCESS;
}

static enum AVPixelFormat get_pixel_format(DNNData *data)
{
    if (data->dt == DNN_UINT8 && data->order == DCO_BGR) {
        return AV_PIX_FMT_BGR24;
    }

    av_assert0(!"not supported yet.\n");
    return AV_PIX_FMT_BGR24;
}

static DNNReturnType proc_from_frame_to_dnn_analytics(AVFrame *frame, DNNData *input, void *log_ctx)
{
    struct SwsContext *sws_ctx;
    int linesizes[4];
    enum AVPixelFormat fmt = get_pixel_format(input);
    sws_ctx = sws_getContext(frame->width, frame->height, frame->format,
                             input->width, input->height, fmt,
                             SWS_FAST_BILINEAR, NULL, NULL, NULL);
    if (!sws_ctx) {
        av_log(log_ctx, AV_LOG_ERROR, "Impossible to create scale context for the conversion "
            "fmt:%s s:%dx%d -> fmt:%s s:%dx%d\n",
            av_get_pix_fmt_name(frame->format), frame->width, frame->height,
            av_get_pix_fmt_name(fmt), input->width, input->height);
        return DNN_ERROR;
    }

    if (av_image_fill_linesizes(linesizes, fmt, input->width) < 0) {
        av_log(log_ctx, AV_LOG_ERROR, "unable to get linesizes with av_image_fill_linesizes");
        sws_freeContext(sws_ctx);
        return DNN_ERROR;
    }

    sws_scale(sws_ctx, (const uint8_t *const *)frame->data, frame->linesize, 0, frame->height,
                       (uint8_t *const *)(&input->data), linesizes);

    sws_freeContext(sws_ctx);
    return DNN_SUCCESS;
}

DNNReturnType ff_proc_from_frame_to_dnn(AVFrame *frame, DNNData *input, DNNFunctionType func_type, void *log_ctx)
{
    switch (func_type)
    {
    case DFT_PROCESS_FRAME:
        return proc_from_frame_to_dnn_frameprocessing(frame, input, log_ctx);
    case DFT_ANALYTICS_DETECT:
        return proc_from_frame_to_dnn_analytics(frame, input, log_ctx);
    default:
        avpriv_report_missing_feature(log_ctx, "model function type %d", func_type);
        return DNN_ERROR;
    }
}
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`/*`
			`* Copyright (c) 2020`
			`*`
			`* This file is part of FFmpeg.`
			`*`
			`* FFmpeg is free software; you can redistribute it and/or`
			`* modify it under the terms of the GNU Lesser General Public`
			`* License as published by the Free Software Foundation; either`
			`* version 2.1 of the License, or (at your option) any later version.`
			`*`
			`* FFmpeg is distributed in the hope that it will be useful,`
			`* but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU`
			`* Lesser General Public License for more details.`
			`*`
			`* You should have received a copy of the GNU Lesser General Public`
			`* License along with FFmpeg; if not, write to the Free Software`
			`* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA`
			`*/`

			`#include "dnn_io_proc.h"`
			`#include "libavutil/imgutils.h"`
			`#include "libswscale/swscale.h"`
dnn: add color conversion for analytic case Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-02-07 07:03:43 +00:00			`#include "libavutil/avassert.h"`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00
libavfilter/dnn: add prefix ff_ for internal functions from proc_from_frame_to_dnn to ff_proc_from_frame_to_dnn, and from proc_from_dnn_to_frame to ff_proc_from_dnn_to_frame. Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-01-18 08:00:58 +00:00			`DNNReturnType ff_proc_from_dnn_to_frame(AVFrame frame, DNNData output, void *log_ctx)`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`{`
			`struct SwsContext *sws_ctx;`
			`int bytewidth = av_image_get_linesize(frame->format, frame->width, 0);`
			`if (output->dt != DNN_FLOAT) {`
libavfilter/dnn: use avpriv_report_missing_feature for unsupported features Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-01-18 07:56:34 +00:00			`avpriv_report_missing_feature(log_ctx, "data type rather than DNN_FLOAT");`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`return DNN_ERROR;`
			`}`

			`switch (frame->format) {`
			`case AV_PIX_FMT_RGB24:`
			`case AV_PIX_FMT_BGR24:`
			`sws_ctx = sws_getContext(frame->width * 3,`
			`frame->height,`
			`AV_PIX_FMT_GRAYF32,`
			`frame->width * 3,`
			`frame->height,`
			`AV_PIX_FMT_GRAY8,`
			`0, NULL, NULL, NULL);`
lavfi/dnn: check the return value from sws_getContext sws_getContext may be return NULL, and it's will be dereferenced, so add the check. Signed-off-by: Jun Zhao <barryjzhao@tencent.com> 2020-12-09 09:53:10 +00:00			`if (!sws_ctx) {`
			`av_log(log_ctx, AV_LOG_ERROR, "Impossible to create scale context for the conversion "`
			`"fmt:%s s:%dx%d -> fmt:%s s:%dx%d\n",`
			`av_get_pix_fmt_name(AV_PIX_FMT_GRAYF32), frame->width * 3, frame->height,`
			`av_get_pix_fmt_name(AV_PIX_FMT_GRAY8), frame->width * 3, frame->height);`
			`return DNN_ERROR;`
			`}`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`sws_scale(sws_ctx, (const uint8_t [4]){(const uint8_t )output->data, 0, 0, 0},`
			`(const int[4]){frame->width * 3 * sizeof(float), 0, 0, 0}, 0, frame->height,`
			`(uint8_t * const*)frame->data, frame->linesize);`
			`sws_freeContext(sws_ctx);`
			`return DNN_SUCCESS;`
			`case AV_PIX_FMT_GRAYF32:`
			`av_image_copy_plane(frame->data[0], frame->linesize[0],`
			`output->data, bytewidth,`
			`bytewidth, frame->height);`
			`return DNN_SUCCESS;`
			`case AV_PIX_FMT_YUV420P:`
			`case AV_PIX_FMT_YUV422P:`
			`case AV_PIX_FMT_YUV444P:`
			`case AV_PIX_FMT_YUV410P:`
			`case AV_PIX_FMT_YUV411P:`
			`case AV_PIX_FMT_GRAY8:`
dnn: add NV12 pixel format support Signed-off-by: Ting Fu <ting.fu@intel.com> Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2020-12-18 08:08:29 +00:00			`case AV_PIX_FMT_NV12:`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`sws_ctx = sws_getContext(frame->width,`
			`frame->height,`
			`AV_PIX_FMT_GRAYF32,`
			`frame->width,`
			`frame->height,`
			`AV_PIX_FMT_GRAY8,`
			`0, NULL, NULL, NULL);`
lavfi/dnn: check the return value from sws_getContext sws_getContext may be return NULL, and it's will be dereferenced, so add the check. Signed-off-by: Jun Zhao <barryjzhao@tencent.com> 2020-12-09 09:53:10 +00:00			`if (!sws_ctx) {`
			`av_log(log_ctx, AV_LOG_ERROR, "Impossible to create scale context for the conversion "`
			`"fmt:%s s:%dx%d -> fmt:%s s:%dx%d\n",`
			`av_get_pix_fmt_name(AV_PIX_FMT_GRAYF32), frame->width, frame->height,`
			`av_get_pix_fmt_name(AV_PIX_FMT_GRAY8), frame->width, frame->height);`
			`return DNN_ERROR;`
			`}`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`sws_scale(sws_ctx, (const uint8_t [4]){(const uint8_t )output->data, 0, 0, 0},`
			`(const int[4]){frame->width * sizeof(float), 0, 0, 0}, 0, frame->height,`
			`(uint8_t * const*)frame->data, frame->linesize);`
			`sws_freeContext(sws_ctx);`
			`return DNN_SUCCESS;`
			`default:`
libavfilter/dnn: use avpriv_report_missing_feature for unsupported features Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-01-18 07:56:34 +00:00			`avpriv_report_missing_feature(log_ctx, "%s", av_get_pix_fmt_name(frame->format));`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`return DNN_ERROR;`
			`}`

			`return DNN_SUCCESS;`
			`}`

dnn: add color conversion for analytic case Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-02-07 07:03:43 +00:00			`static DNNReturnType proc_from_frame_to_dnn_frameprocessing(AVFrame frame, DNNData input, void *log_ctx)`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`{`
			`struct SwsContext *sws_ctx;`
			`int bytewidth = av_image_get_linesize(frame->format, frame->width, 0);`
			`if (input->dt != DNN_FLOAT) {`
libavfilter/dnn: use avpriv_report_missing_feature for unsupported features Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-01-18 07:56:34 +00:00			`avpriv_report_missing_feature(log_ctx, "data type rather than DNN_FLOAT");`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`return DNN_ERROR;`
			`}`

			`switch (frame->format) {`
			`case AV_PIX_FMT_RGB24:`
			`case AV_PIX_FMT_BGR24:`
			`sws_ctx = sws_getContext(frame->width * 3,`
			`frame->height,`
			`AV_PIX_FMT_GRAY8,`
			`frame->width * 3,`
			`frame->height,`
			`AV_PIX_FMT_GRAYF32,`
			`0, NULL, NULL, NULL);`
lavfi/dnn: check the return value from sws_getContext sws_getContext may be return NULL, and it's will be dereferenced, so add the check. Signed-off-by: Jun Zhao <barryjzhao@tencent.com> 2020-12-09 09:53:10 +00:00			`if (!sws_ctx) {`
			`av_log(log_ctx, AV_LOG_ERROR, "Impossible to create scale context for the conversion "`
			`"fmt:%s s:%dx%d -> fmt:%s s:%dx%d\n",`
			`av_get_pix_fmt_name(AV_PIX_FMT_GRAY8), frame->width * 3, frame->height,`
			`av_get_pix_fmt_name(AV_PIX_FMT_GRAYF32),frame->width * 3, frame->height);`
			`return DNN_ERROR;`
			`}`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`sws_scale(sws_ctx, (const uint8_t **)frame->data,`
			`frame->linesize, 0, frame->height,`
			`(uint8_t * const*)(&input->data),`
			`(const int [4]){frame->width * 3 * sizeof(float), 0, 0, 0});`
			`sws_freeContext(sws_ctx);`
			`break;`
			`case AV_PIX_FMT_GRAYF32:`
			`av_image_copy_plane(input->data, bytewidth,`
			`frame->data[0], frame->linesize[0],`
			`bytewidth, frame->height);`
			`break;`
			`case AV_PIX_FMT_YUV420P:`
			`case AV_PIX_FMT_YUV422P:`
			`case AV_PIX_FMT_YUV444P:`
			`case AV_PIX_FMT_YUV410P:`
			`case AV_PIX_FMT_YUV411P:`
			`case AV_PIX_FMT_GRAY8:`
dnn: add NV12 pixel format support Signed-off-by: Ting Fu <ting.fu@intel.com> Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2020-12-18 08:08:29 +00:00			`case AV_PIX_FMT_NV12:`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`sws_ctx = sws_getContext(frame->width,`
			`frame->height,`
			`AV_PIX_FMT_GRAY8,`
			`frame->width,`
			`frame->height,`
			`AV_PIX_FMT_GRAYF32,`
			`0, NULL, NULL, NULL);`
lavfi/dnn: check the return value from sws_getContext sws_getContext may be return NULL, and it's will be dereferenced, so add the check. Signed-off-by: Jun Zhao <barryjzhao@tencent.com> 2020-12-09 09:53:10 +00:00			`if (!sws_ctx) {`
			`av_log(log_ctx, AV_LOG_ERROR, "Impossible to create scale context for the conversion "`
			`"fmt:%s s:%dx%d -> fmt:%s s:%dx%d\n",`
			`av_get_pix_fmt_name(AV_PIX_FMT_GRAY8), frame->width, frame->height,`
			`av_get_pix_fmt_name(AV_PIX_FMT_GRAYF32),frame->width, frame->height);`
			`return DNN_ERROR;`
			`}`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`sws_scale(sws_ctx, (const uint8_t **)frame->data,`
			`frame->linesize, 0, frame->height,`
			`(uint8_t * const*)(&input->data),`
			`(const int [4]){frame->width * sizeof(float), 0, 0, 0});`
			`sws_freeContext(sws_ctx);`
			`break;`
			`default:`
libavfilter/dnn: use avpriv_report_missing_feature for unsupported features Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-01-18 07:56:34 +00:00			`avpriv_report_missing_feature(log_ctx, "%s", av_get_pix_fmt_name(frame->format));`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 04:51:44 +00:00			`return DNN_ERROR;`
			`}`

			`return DNN_SUCCESS;`
			`}`
dnn: add color conversion for analytic case Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-02-07 07:03:43 +00:00
			`static enum AVPixelFormat get_pixel_format(DNNData *data)`
			`{`
			`if (data->dt == DNN_UINT8 && data->order == DCO_BGR) {`
			`return AV_PIX_FMT_BGR24;`
			`}`

			`av_assert0(!"not supported yet.\n");`
			`return AV_PIX_FMT_BGR24;`
			`}`

			`static DNNReturnType proc_from_frame_to_dnn_analytics(AVFrame frame, DNNData input, void *log_ctx)`
			`{`
			`struct SwsContext *sws_ctx;`
			`int linesizes[4];`
			`enum AVPixelFormat fmt = get_pixel_format(input);`
			`sws_ctx = sws_getContext(frame->width, frame->height, frame->format,`
			`input->width, input->height, fmt,`
			`SWS_FAST_BILINEAR, NULL, NULL, NULL);`
			`if (!sws_ctx) {`
			`av_log(log_ctx, AV_LOG_ERROR, "Impossible to create scale context for the conversion "`
			`"fmt:%s s:%dx%d -> fmt:%s s:%dx%d\n",`
			`av_get_pix_fmt_name(frame->format), frame->width, frame->height,`
			`av_get_pix_fmt_name(fmt), input->width, input->height);`
			`return DNN_ERROR;`
			`}`

			`if (av_image_fill_linesizes(linesizes, fmt, input->width) < 0) {`
			`av_log(log_ctx, AV_LOG_ERROR, "unable to get linesizes with av_image_fill_linesizes");`
			`sws_freeContext(sws_ctx);`
			`return DNN_ERROR;`
			`}`

			`sws_scale(sws_ctx, (const uint8_t const )frame->data, frame->linesize, 0, frame->height,`
			`(uint8_t const )(&input->data), linesizes);`

			`sws_freeContext(sws_ctx);`
			`return DNN_SUCCESS;`
			`}`

			`DNNReturnType ff_proc_from_frame_to_dnn(AVFrame frame, DNNData input, DNNFunctionType func_type, void *log_ctx)`
			`{`
			`switch (func_type)`
			`{`
			`case DFT_PROCESS_FRAME:`
			`return proc_from_frame_to_dnn_frameprocessing(frame, input, log_ctx);`
			`case DFT_ANALYTICS_DETECT:`
			`return proc_from_frame_to_dnn_analytics(frame, input, log_ctx);`
			`default:`
			`avpriv_report_missing_feature(log_ctx, "model function type %d", func_type);`
			`return DNN_ERROR;`
			`}`
			`}`