disflow.h - mozsearch

Enable keyboard shortcuts

/*

 * Copyright (c) 2016, Alliance for Open Media. All rights reserved.

 * This source code is subject to the terms of the BSD 2 Clause License and

 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License

 * was not distributed with this source code in the LICENSE file, you can

 * obtain it at www.aomedia.org/license/software. If the Alliance for Open

 * Media Patent License 1.0 was not distributed with this source code in the

 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.

*/

#ifndef AOM_AOM_DSP_FLOW_ESTIMATION_DISFLOW_H_

#define AOM_AOM_DSP_FLOW_ESTIMATION_DISFLOW_H_

#include <stdbool.h>

#include "aom_dsp/flow_estimation/flow_estimation.h"

#include "aom_scale/yv12config.h"

#ifdef __cplusplus

extern "C" {

#endif

// Number of pyramid levels in disflow computation

#define DISFLOW_PYRAMID_LEVELS 12

// Size of square patches in the disflow dense grid

// Must be a power of 2

#define DISFLOW_PATCH_SIZE_LOG2 3

#define DISFLOW_PATCH_SIZE (1 << DISFLOW_PATCH_SIZE_LOG2)

// Center point of square patch

#define DISFLOW_PATCH_CENTER ((DISFLOW_PATCH_SIZE / 2) - 1)

// Overall scale of the `dx`, `dy` and `dt` arrays in the disflow code

// In other words, the various derivatives are calculated with an internal

// precision of (8 + DISFLOW_DERIV_SCALE_LOG2) bits, from an 8-bit input.

//

// This must be carefully synchronized with the code in sobel_filter()

// (which fills the dx and dy arrays) and compute_flow_error() (which

// fills dt); see the comments in those functions for more details

#define DISFLOW_DERIV_SCALE_LOG2 3

#define DISFLOW_DERIV_SCALE (1 << DISFLOW_DERIV_SCALE_LOG2)

// Scale factor applied to each step in the main refinement loop

//

// This should be <= 1.0 to avoid overshoot. Values below 1.0

// may help in some cases, but slow convergence overall, so

// will require careful tuning.

// TODO(rachelbarker): Tune this value

#define DISFLOW_STEP_SIZE 1.0

// Step size at which we should terminate iteration

// The idea here is that, if we take a step which is much smaller than 1px in

// size, then the values won't change much from iteration to iteration, so

// many future steps will also be small, and that won't have much effect

// on the ultimate result. So we can terminate early.

//

// To look at it another way, when we take a small step, that means that

// either we're near to convergence (so can stop), or we're stuck in a

// shallow valley and will take many iterations to get unstuck.

//

// Solving the latter properly requires fancier methods, such as "gradient

// descent with momentum". For now, we terminate to avoid wasting a ton of

// time on points which are either nearly-converged or stuck.

//

// Terminating at 1/8 px seems to give good results for global motion estimation

#define DISFLOW_STEP_SIZE_THRESOLD (1. / 8.)

// Max number of iterations if warp convergence is not found

#define DISFLOW_MAX_ITR 4

// Internal precision of cubic interpolation filters

// The limiting factor here is that:

// * Before integerizing, the maximum value of any kernel tap is 1.0

// * After integerizing, each tap must fit into an int16_t.

// Thus the largest multiplier we can get away with is 2^14 = 16384,

// as 2^15 = 32768 is too large to fit in an int16_t.

#define DISFLOW_INTERP_BITS 14

typedef struct {

  // Start of allocation for u and v buffers

  double *buf0;

  // x and y directions of flow, per patch

  double *u;

  double *v;

  // Sizes of the above arrays

  int width;

  int height;

  int stride;

} FlowField;

bool av1_compute_global_motion_disflow(

    TransformationType type, YV12_BUFFER_CONFIG *src, YV12_BUFFER_CONFIG *ref,

    int bit_depth, int downsample_level, MotionModel *motion_models,

    int num_motion_models, bool *mem_alloc_failed);

#ifdef __cplusplus

#endif

#endif  // AOM_AOM_DSP_FLOW_ESTIMATION_DISFLOW_H_