| /** |
| * Copyright (c) 2016 Davinder Singh (DSM_) <ds.mudhar<@gmail.com> |
| * |
| * This file is part of FFmpeg. |
| * |
| * FFmpeg is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU Lesser General Public |
| * License as published by the Free Software Foundation; either |
| * version 2.1 of the License, or (at your option) any later version. |
| * |
| * FFmpeg is distributed in the hope that it will be useful, |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| * Lesser General Public License for more details. |
| * |
| * You should have received a copy of the GNU Lesser General Public |
| * License along with FFmpeg; if not, write to the Free Software |
| * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
| */ |
| |
| #include "motion_estimation.h" |
| #include "libavcodec/mathops.h" |
| #include "libavutil/avassert.h" |
| #include "libavutil/common.h" |
| #include "libavutil/imgutils.h" |
| #include "libavutil/opt.h" |
| #include "libavutil/pixdesc.h" |
| #include "libavutil/motion_vector.h" |
| #include "avfilter.h" |
| #include "formats.h" |
| #include "internal.h" |
| #include "video.h" |
| |
| typedef struct MEContext { |
| const AVClass *class; |
| AVMotionEstContext me_ctx; |
| int method; ///< motion estimation method |
| |
| int mb_size; ///< macroblock size |
| int search_param; ///< search parameter |
| int b_width, b_height, b_count; |
| int log2_mb_size; |
| |
| AVFrame *prev, *cur, *next; |
| |
| int (*mv_table[3])[2][2]; ///< motion vectors of current & prev 2 frames |
| } MEContext; |
| |
| #define OFFSET(x) offsetof(MEContext, x) |
| #define FLAGS AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_FILTERING_PARAM |
| #define CONST(name, help, val, unit) { name, help, 0, AV_OPT_TYPE_CONST, {.i64=val}, 0, 0, FLAGS, unit } |
| |
| static const AVOption mestimate_options[] = { |
| { "method", "motion estimation method", OFFSET(method), AV_OPT_TYPE_INT, {.i64 = AV_ME_METHOD_ESA}, AV_ME_METHOD_ESA, AV_ME_METHOD_UMH, FLAGS, "method" }, |
| CONST("esa", "exhaustive search", AV_ME_METHOD_ESA, "method"), |
| CONST("tss", "three step search", AV_ME_METHOD_TSS, "method"), |
| CONST("tdls", "two dimensional logarithmic search", AV_ME_METHOD_TDLS, "method"), |
| CONST("ntss", "new three step search", AV_ME_METHOD_NTSS, "method"), |
| CONST("fss", "four step search", AV_ME_METHOD_FSS, "method"), |
| CONST("ds", "diamond search", AV_ME_METHOD_DS, "method"), |
| CONST("hexbs", "hexagon-based search", AV_ME_METHOD_HEXBS, "method"), |
| CONST("epzs", "enhanced predictive zonal search", AV_ME_METHOD_EPZS, "method"), |
| CONST("umh", "uneven multi-hexagon search", AV_ME_METHOD_UMH, "method"), |
| { "mb_size", "macroblock size", OFFSET(mb_size), AV_OPT_TYPE_INT, {.i64 = 16}, 8, INT_MAX, FLAGS }, |
| { "search_param", "search parameter", OFFSET(search_param), AV_OPT_TYPE_INT, {.i64 = 7}, 4, INT_MAX, FLAGS }, |
| { NULL } |
| }; |
| |
| AVFILTER_DEFINE_CLASS(mestimate); |
| |
| static int query_formats(AVFilterContext *ctx) |
| { |
| static const enum AVPixelFormat pix_fmts[] = { |
| AV_PIX_FMT_YUV410P, AV_PIX_FMT_YUV411P, |
| AV_PIX_FMT_YUV420P, AV_PIX_FMT_YUV422P, |
| AV_PIX_FMT_YUV440P, AV_PIX_FMT_YUV444P, |
| AV_PIX_FMT_YUVJ444P, AV_PIX_FMT_YUVJ440P, |
| AV_PIX_FMT_YUVJ422P, AV_PIX_FMT_YUVJ420P, |
| AV_PIX_FMT_YUVJ411P, |
| AV_PIX_FMT_YUVA420P, AV_PIX_FMT_YUVA422P, AV_PIX_FMT_YUVA444P, |
| AV_PIX_FMT_GRAY8, |
| AV_PIX_FMT_NONE |
| }; |
| |
| AVFilterFormats *fmts_list = ff_make_format_list(pix_fmts); |
| if (!fmts_list) |
| return AVERROR(ENOMEM); |
| return ff_set_common_formats(ctx, fmts_list); |
| } |
| |
| static int config_input(AVFilterLink *inlink) |
| { |
| MEContext *s = inlink->dst->priv; |
| int i; |
| |
| s->log2_mb_size = av_ceil_log2_c(s->mb_size); |
| s->mb_size = 1 << s->log2_mb_size; |
| |
| s->b_width = inlink->w >> s->log2_mb_size; |
| s->b_height = inlink->h >> s->log2_mb_size; |
| s->b_count = s->b_width * s->b_height; |
| |
| for (i = 0; i < 3; i++) { |
| s->mv_table[i] = av_mallocz_array(s->b_count, sizeof(*s->mv_table[0])); |
| if (!s->mv_table[i]) |
| return AVERROR(ENOMEM); |
| } |
| |
| ff_me_init_context(&s->me_ctx, s->mb_size, s->search_param, inlink->w, inlink->h, 0, (s->b_width - 1) << s->log2_mb_size, 0, (s->b_height - 1) << s->log2_mb_size); |
| |
| return 0; |
| } |
| |
| static void add_mv_data(AVMotionVector *mv, int mb_size, |
| int x, int y, int x_mv, int y_mv, int dir) |
| { |
| mv->w = mb_size; |
| mv->h = mb_size; |
| mv->dst_x = x + (mb_size >> 1); |
| mv->dst_y = y + (mb_size >> 1); |
| mv->src_x = x_mv + (mb_size >> 1); |
| mv->src_y = y_mv + (mb_size >> 1); |
| mv->source = dir ? 1 : -1; |
| mv->flags = 0; |
| } |
| |
/**
 * Run ff_me_search_<method>() on every whole macroblock and append one
 * AVMotionVector per block to the side data.
 *
 * Not self-contained: the expansion uses the caller's locals s, me_ctx, sd,
 * mb_x, mb_y, mv_count and dir.
 */
#define SEARCH_MV(method)\
    do {\
        AVMotionVector *const mv_out = (AVMotionVector *) sd->data;\
        for (mb_y = 0; mb_y < s->b_height; mb_y++) {\
            for (mb_x = 0; mb_x < s->b_width; mb_x++) {\
                const int x_mb = mb_x << s->log2_mb_size;\
                const int y_mb = mb_y << s->log2_mb_size;\
                int mv[2] = { x_mb, y_mb };\
                ff_me_search_##method(me_ctx, x_mb, y_mb, mv);\
                add_mv_data(&mv_out[mv_count], me_ctx->mb_size,\
                            x_mb, y_mb, mv[0], mv[1], dir);\
                mv_count++;\
            }\
        }\
    } while (0)

/**
 * Append the candidate vector (px, py) to a predictor set and bump its
 * counter. No capacity check is performed.
 */
#define ADD_PRED(preds, px, py)\
    do {\
        (preds).mvs[(preds).nb][0] = (px);\
        (preds).mvs[(preds).nb][1] = (py);\
        (preds).nb++;\
    } while (0)
| |
| static int filter_frame(AVFilterLink *inlink, AVFrame *frame) |
| { |
| AVFilterContext *ctx = inlink->dst; |
| MEContext *s = ctx->priv; |
| AVMotionEstContext *me_ctx = &s->me_ctx; |
| AVFrameSideData *sd; |
| AVFrame *out; |
| int mb_x, mb_y, dir; |
| int32_t mv_count = 0; |
| int ret; |
| |
| if (frame->pts == AV_NOPTS_VALUE) { |
| ret = ff_filter_frame(ctx->outputs[0], frame); |
| return ret; |
| } |
| |
| av_frame_free(&s->prev); |
| s->prev = s->cur; |
| s->cur = s->next; |
| s->next = frame; |
| |
| s->mv_table[2] = memcpy(s->mv_table[2], s->mv_table[1], sizeof(*s->mv_table[1]) * s->b_count); |
| s->mv_table[1] = memcpy(s->mv_table[1], s->mv_table[0], sizeof(*s->mv_table[0]) * s->b_count); |
| |
| if (!s->cur) { |
| s->cur = av_frame_clone(frame); |
| if (!s->cur) |
| return AVERROR(ENOMEM); |
| } |
| |
| if (!s->prev) |
| return 0; |
| |
| out = av_frame_clone(s->cur); |
| if (!out) |
| return AVERROR(ENOMEM); |
| |
| sd = av_frame_new_side_data(out, AV_FRAME_DATA_MOTION_VECTORS, 2 * s->b_count * sizeof(AVMotionVector)); |
| if (!sd) { |
| av_frame_free(&out); |
| return AVERROR(ENOMEM); |
| } |
| |
| me_ctx->data_cur = s->cur->data[0]; |
| me_ctx->linesize = s->cur->linesize[0]; |
| |
| for (dir = 0; dir < 2; dir++) { |
| me_ctx->data_ref = (dir ? s->next : s->prev)->data[0]; |
| |
| if (s->method == AV_ME_METHOD_DS) |
| SEARCH_MV(ds); |
| else if (s->method == AV_ME_METHOD_ESA) |
| SEARCH_MV(esa); |
| else if (s->method == AV_ME_METHOD_FSS) |
| SEARCH_MV(fss); |
| else if (s->method == AV_ME_METHOD_NTSS) |
| SEARCH_MV(ntss); |
| else if (s->method == AV_ME_METHOD_TDLS) |
| SEARCH_MV(tdls); |
| else if (s->method == AV_ME_METHOD_TSS) |
| SEARCH_MV(tss); |
| else if (s->method == AV_ME_METHOD_HEXBS) |
| SEARCH_MV(hexbs); |
| else if (s->method == AV_ME_METHOD_UMH) { |
| for (mb_y = 0; mb_y < s->b_height; mb_y++) |
| for (mb_x = 0; mb_x < s->b_width; mb_x++) { |
| const int mb_i = mb_x + mb_y * s->b_width; |
| const int x_mb = mb_x << s->log2_mb_size; |
| const int y_mb = mb_y << s->log2_mb_size; |
| int mv[2] = {x_mb, y_mb}; |
| |
| AVMotionEstPredictor *preds = me_ctx->preds; |
| preds[0].nb = 0; |
| |
| ADD_PRED(preds[0], 0, 0); |
| |
| //left mb in current frame |
| if (mb_x > 0) |
| ADD_PRED(preds[0], s->mv_table[0][mb_i - 1][dir][0], s->mv_table[0][mb_i - 1][dir][1]); |
| |
| if (mb_y > 0) { |
| //top mb in current frame |
| ADD_PRED(preds[0], s->mv_table[0][mb_i - s->b_width][dir][0], s->mv_table[0][mb_i - s->b_width][dir][1]); |
| |
| //top-right mb in current frame |
| if (mb_x + 1 < s->b_width) |
| ADD_PRED(preds[0], s->mv_table[0][mb_i - s->b_width + 1][dir][0], s->mv_table[0][mb_i - s->b_width + 1][dir][1]); |
| //top-left mb in current frame |
| else if (mb_x > 0) |
| ADD_PRED(preds[0], s->mv_table[0][mb_i - s->b_width - 1][dir][0], s->mv_table[0][mb_i - s->b_width - 1][dir][1]); |
| } |
| |
| //median predictor |
| if (preds[0].nb == 4) { |
| me_ctx->pred_x = mid_pred(preds[0].mvs[1][0], preds[0].mvs[2][0], preds[0].mvs[3][0]); |
| me_ctx->pred_y = mid_pred(preds[0].mvs[1][1], preds[0].mvs[2][1], preds[0].mvs[3][1]); |
| } else if (preds[0].nb == 3) { |
| me_ctx->pred_x = mid_pred(0, preds[0].mvs[1][0], preds[0].mvs[2][0]); |
| me_ctx->pred_y = mid_pred(0, preds[0].mvs[1][1], preds[0].mvs[2][1]); |
| } else if (preds[0].nb == 2) { |
| me_ctx->pred_x = preds[0].mvs[1][0]; |
| me_ctx->pred_y = preds[0].mvs[1][1]; |
| } else { |
| me_ctx->pred_x = 0; |
| me_ctx->pred_y = 0; |
| } |
| |
| ff_me_search_umh(me_ctx, x_mb, y_mb, mv); |
| |
| s->mv_table[0][mb_i][dir][0] = mv[0] - x_mb; |
| s->mv_table[0][mb_i][dir][1] = mv[1] - y_mb; |
| add_mv_data(((AVMotionVector *) sd->data) + mv_count++, me_ctx->mb_size, x_mb, y_mb, mv[0], mv[1], dir); |
| } |
| |
| } else if (s->method == AV_ME_METHOD_EPZS) { |
| |
| for (mb_y = 0; mb_y < s->b_height; mb_y++) |
| for (mb_x = 0; mb_x < s->b_width; mb_x++) { |
| const int mb_i = mb_x + mb_y * s->b_width; |
| const int x_mb = mb_x << s->log2_mb_size; |
| const int y_mb = mb_y << s->log2_mb_size; |
| int mv[2] = {x_mb, y_mb}; |
| |
| AVMotionEstPredictor *preds = me_ctx->preds; |
| preds[0].nb = 0; |
| preds[1].nb = 0; |
| |
| ADD_PRED(preds[0], 0, 0); |
| |
| //left mb in current frame |
| if (mb_x > 0) |
| ADD_PRED(preds[0], s->mv_table[0][mb_i - 1][dir][0], s->mv_table[0][mb_i - 1][dir][1]); |
| |
| //top mb in current frame |
| if (mb_y > 0) |
| ADD_PRED(preds[0], s->mv_table[0][mb_i - s->b_width][dir][0], s->mv_table[0][mb_i - s->b_width][dir][1]); |
| |
| //top-right mb in current frame |
| if (mb_y > 0 && mb_x + 1 < s->b_width) |
| ADD_PRED(preds[0], s->mv_table[0][mb_i - s->b_width + 1][dir][0], s->mv_table[0][mb_i - s->b_width + 1][dir][1]); |
| |
| //median predictor |
| if (preds[0].nb == 4) { |
| me_ctx->pred_x = mid_pred(preds[0].mvs[1][0], preds[0].mvs[2][0], preds[0].mvs[3][0]); |
| me_ctx->pred_y = mid_pred(preds[0].mvs[1][1], preds[0].mvs[2][1], preds[0].mvs[3][1]); |
| } else if (preds[0].nb == 3) { |
| me_ctx->pred_x = mid_pred(0, preds[0].mvs[1][0], preds[0].mvs[2][0]); |
| me_ctx->pred_y = mid_pred(0, preds[0].mvs[1][1], preds[0].mvs[2][1]); |
| } else if (preds[0].nb == 2) { |
| me_ctx->pred_x = preds[0].mvs[1][0]; |
| me_ctx->pred_y = preds[0].mvs[1][1]; |
| } else { |
| me_ctx->pred_x = 0; |
| me_ctx->pred_y = 0; |
| } |
| |
| //collocated mb in prev frame |
| ADD_PRED(preds[0], s->mv_table[1][mb_i][dir][0], s->mv_table[1][mb_i][dir][1]); |
| |
| //accelerator motion vector of collocated block in prev frame |
| ADD_PRED(preds[1], s->mv_table[1][mb_i][dir][0] + (s->mv_table[1][mb_i][dir][0] - s->mv_table[2][mb_i][dir][0]), |
| s->mv_table[1][mb_i][dir][1] + (s->mv_table[1][mb_i][dir][1] - s->mv_table[2][mb_i][dir][1])); |
| |
| //left mb in prev frame |
| if (mb_x > 0) |
| ADD_PRED(preds[1], s->mv_table[1][mb_i - 1][dir][0], s->mv_table[1][mb_i - 1][dir][1]); |
| |
| //top mb in prev frame |
| if (mb_y > 0) |
| ADD_PRED(preds[1], s->mv_table[1][mb_i - s->b_width][dir][0], s->mv_table[1][mb_i - s->b_width][dir][1]); |
| |
| //right mb in prev frame |
| if (mb_x + 1 < s->b_width) |
| ADD_PRED(preds[1], s->mv_table[1][mb_i + 1][dir][0], s->mv_table[1][mb_i + 1][dir][1]); |
| |
| //bottom mb in prev frame |
| if (mb_y + 1 < s->b_height) |
| ADD_PRED(preds[1], s->mv_table[1][mb_i + s->b_width][dir][0], s->mv_table[1][mb_i + s->b_width][dir][1]); |
| |
| ff_me_search_epzs(me_ctx, x_mb, y_mb, mv); |
| |
| s->mv_table[0][mb_i][dir][0] = mv[0] - x_mb; |
| s->mv_table[0][mb_i][dir][1] = mv[1] - y_mb; |
| add_mv_data(((AVMotionVector *) sd->data) + mv_count++, s->mb_size, x_mb, y_mb, mv[0], mv[1], dir); |
| } |
| } |
| } |
| |
| return ff_filter_frame(ctx->outputs[0], out); |
| } |
| |
| static av_cold void uninit(AVFilterContext *ctx) |
| { |
| MEContext *s = ctx->priv; |
| int i; |
| |
| av_frame_free(&s->prev); |
| av_frame_free(&s->cur); |
| av_frame_free(&s->next); |
| |
| for (i = 0; i < 3; i++) |
| av_freep(&s->mv_table[i]); |
| } |
| |
| static const AVFilterPad mestimate_inputs[] = { |
| { |
| .name = "default", |
| .type = AVMEDIA_TYPE_VIDEO, |
| .filter_frame = filter_frame, |
| .config_props = config_input, |
| }, |
| { NULL } |
| }; |
| |
| static const AVFilterPad mestimate_outputs[] = { |
| { |
| .name = "default", |
| .type = AVMEDIA_TYPE_VIDEO, |
| }, |
| { NULL } |
| }; |
| |
| AVFilter ff_vf_mestimate = { |
| .name = "mestimate", |
| .description = NULL_IF_CONFIG_SMALL("Generate motion vectors."), |
| .priv_size = sizeof(MEContext), |
| .priv_class = &mestimate_class, |
| .uninit = uninit, |
| .query_formats = query_formats, |
| .inputs = mestimate_inputs, |
| .outputs = mestimate_outputs, |
| }; |