v5.16/lucas__kanade_8c_source.html

 /*

  * Copyright (C) 2014 G. de Croon

  *               2015 Freek van Tienen <freek.v.tienen@gmail.com>

  *               2016 Hrvoje Brezak <hrvoje.brezak@gmail.com>

  *

  * This file is part of Paparazzi.

  *

  * Paparazzi is free software; you can redistribute it and/or modify

  * it under the terms of the GNU General Public License as published by

  * the Free Software Foundation; either version 2, or (at your option)

  * any later version.

  *

  * Paparazzi is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

  * GNU General Public License for more details.

  *

  * You should have received a copy of the GNU General Public License

  * along with Paparazzi; see the file COPYING.  If not, see

  * <http://www.gnu.org/licenses/>.

  */


 #include <stdlib.h>

 #include <stdio.h>

 #include <math.h>

 #include <string.h>

 #include "lucas_kanade.h"


 struct flow_t *opticFlowLK(struct image_t *new_img, struct image_t *old_img, struct point_t *points,

                            uint16_t *points_cnt, uint16_t half_window_size,

                            uint16_t subpixel_factor, uint8_t max_iterations, uint8_t step_threshold, uint8_t max_points, uint8_t pyramid_level,

                            uint8_t keep_bad_points)

 {


   // if no pyramids, use the old code:

   if (pyramid_level == 0) {

     // use the old code in this case:

     return opticFlowLK_flat(new_img, old_img, points, points_cnt, half_window_size, subpixel_factor, max_iterations,

                             step_threshold, max_points, keep_bad_points);

   }


   // Allocate some memory for returning the vectors

   struct flow_t *vectors = calloc(max_points, sizeof(struct flow_t));


   // Determine patch sizes and initialize neighborhoods

   uint16_t patch_size = 2 * half_window_size + 1;

   // TODO: Feature management shows that this threshold rejects corners maybe too often, maybe another formula could be chosen

   uint32_t error_threshold = (25 * 25) * (patch_size * patch_size);

   uint16_t padded_patch_size = patch_size + 2;

   uint16_t border_size = padded_patch_size / 2 + 2; // amount of padding added to images


   // Allocate memory for image pyramids

   struct image_t *pyramid_old = malloc(sizeof(struct image_t) * (pyramid_level + 1));

   struct image_t *pyramid_new = malloc(sizeof(struct image_t) * (pyramid_level + 1));


   // Build pyramid levels

   pyramid_build(old_img, pyramid_old, pyramid_level, border_size);

   pyramid_build(new_img, pyramid_new, pyramid_level, border_size);


   // Create the window images

   struct image_t window_I, window_J, window_DX, window_DY, window_diff;

   image_create(&window_I, padded_patch_size, padded_patch_size, IMAGE_GRAYSCALE);

   image_create(&window_J, patch_size, patch_size, IMAGE_GRAYSCALE);

   image_create(&window_DX, patch_size, patch_size, IMAGE_GRADIENT);

   image_create(&window_DY, patch_size, patch_size, IMAGE_GRADIENT);

   image_create(&window_diff, patch_size, patch_size, IMAGE_GRADIENT);


   // Iterate through pyramid levels

   for (int8_t LVL = pyramid_level; LVL != -1; LVL--) {

     uint16_t points_orig = *points_cnt;

     *points_cnt = 0;

     uint16_t new_p = 0;


     // Calculate the amount of points to skip

     float skip_points = (points_orig > max_points) ? (float)points_orig / max_points : 1;


     // Go through all points

     for (uint16_t i = 0; i < max_points && i < points_orig; i++) {

       uint16_t p = i * skip_points;


       if (LVL == pyramid_level) {

         // Convert point position on original image to a subpixel coordinate on the top pyramid level

         vectors[new_p].pos.x = (points[p].x * subpixel_factor) >> pyramid_level;

         vectors[new_p].pos.y = (points[p].y * subpixel_factor) >> pyramid_level;

         vectors[new_p].flow_x = 0;

         vectors[new_p].flow_y = 0;


       } else {

         // (5) use calculated flow as initial flow estimation for next level of pyramid

         vectors[new_p].pos.x = vectors[p].pos.x << 1;

         vectors[new_p].pos.y = vectors[p].pos.y << 1;

         vectors[new_p].flow_x = vectors[p].flow_x << 1;

         vectors[new_p].flow_y = vectors[p].flow_y << 1;

       }


       // If the pixel is outside original image, do not track it

       if ((((int32_t) vectors[new_p].pos.x + vectors[new_p].flow_x) < 0)

           || ((vectors[new_p].pos.x + vectors[new_p].flow_x) > (uint32_t)((pyramid_new[LVL].w - 1 - 2 * border_size)*

               subpixel_factor))

           || (((int32_t) vectors[new_p].pos.y + vectors[new_p].flow_y) < 0)

           || ((vectors[new_p].pos.y + vectors[new_p].flow_y) > (uint32_t)((pyramid_new[LVL].h - 1 - 2 * border_size)*

               subpixel_factor))) {

         if (keep_bad_points) {

           vectors[new_p].error = LARGE_FLOW_ERROR;

           new_p++;

           (*points_cnt)++;

         }

         continue;

       }


       // (1) determine the subpixel neighborhood in the old image

       image_subpixel_window(&pyramid_old[LVL], &window_I, &vectors[new_p].pos, subpixel_factor, border_size);


       // (2) get the x- and y- gradients

       image_gradients(&window_I, &window_DX, &window_DY);


       // (3) determine the 'G'-matrix [sum(Axx) sum(Axy); sum(Axy) sum(Ayy)], where sum is over the window

       int32_t G[4];

       image_calculate_g(&window_DX, &window_DY, G);


       // calculate G's determinant in subpixel units:

       int32_t Det = (G[0] * G[3] - G[1] * G[2]);


       // Check if the determinant is bigger than 1

       if (Det < 1) {

         if (keep_bad_points) {

           vectors[new_p].error = LARGE_FLOW_ERROR;

           new_p++;

           (*points_cnt)++;

         }

         continue;

       }


       // (4) iterate over taking steps in the image to minimize the error:

       bool tracked = true;


       for (uint8_t it = max_iterations; it--;) {

         struct point_t new_point = { vectors[new_p].pos.x  + vectors[new_p].flow_x,

                  vectors[new_p].pos.y + vectors[new_p].flow_y,

                  0, 0, 0

         };


         // If the pixel is outside original image, do not track it

         if ((((int32_t)vectors[new_p].pos.x  + vectors[new_p].flow_x) < 0)

             || (new_point.x > (uint32_t)((pyramid_new[LVL].w - 1 - 2 * border_size)*subpixel_factor))

             || (((int32_t)vectors[new_p].pos.y  + vectors[new_p].flow_y) < 0)

             || (new_point.y > (uint32_t)((pyramid_new[LVL].h - 1 - 2 * border_size)*subpixel_factor))) {

           tracked = false;

           break;

         }


         //     [a] get the subpixel neighborhood in the new image

         image_subpixel_window(&pyramid_new[LVL], &window_J, &new_point, subpixel_factor, border_size);


         //     [b] determine the image difference between the two neighborhoods

         uint32_t error = image_difference(&window_I, &window_J, &window_diff);


         if (error > error_threshold && it < max_iterations / 2) {

           tracked = false;

           break;

         }


         int32_t b_x = image_multiply(&window_diff, &window_DX, NULL) / 255;

         int32_t b_y = image_multiply(&window_diff, &window_DY, NULL) / 255;


         //     [d] calculate the additional flow step and possibly terminate the iteration

         int16_t step_x = (((int64_t) G[3] * b_x - G[1] * b_y) * subpixel_factor) / Det;

         int16_t step_y = (((int64_t) G[0] * b_y - G[2] * b_x) * subpixel_factor) / Det;


         vectors[new_p].flow_x = vectors[new_p].flow_x + step_x;

         vectors[new_p].flow_y = vectors[new_p].flow_y + step_y;

         vectors[new_p].error = error;


         // Check if we exceeded the treshold CHANGED made this better for 0.03

         if ((abs(step_x) + abs(step_y)) < step_threshold) {

           break;

         }

       } // lucas kanade step iteration


       // If we tracked the point we update the index and the count

       if (tracked) {

         new_p++;

         (*points_cnt)++;

       } else if (keep_bad_points) {

         vectors[new_p].flow_x = 0;

         vectors[new_p].flow_y = 0;

         vectors[new_p].error = LARGE_FLOW_ERROR;

         new_p++;

         (*points_cnt)++;

       }

     } // go through all points


   } // LVL of pyramid


   // Free the images

   image_free(&window_I);

   image_free(&window_J);

   image_free(&window_DX);

   image_free(&window_DY);

   image_free(&window_diff);


   for (int8_t i = pyramid_level; i != -1; i--) {

     image_free(&pyramid_old[i]);

     image_free(&pyramid_new[i]);

   }

   pyramid_old = NULL;

   pyramid_new = NULL;


   // Return the vectors

   return vectors;

 }


 /**
  * Track a set of points from old_img to new_img with a one-level Lucas-Kanade tracker.
  *
  * For all points:
  * (1) determine the subpixel neighborhood in the old image
  * (2) get the x- and y- gradients
  * (3) determine the 'G'-matrix [sum(Axx) sum(Axy); sum(Axy) sum(Ayy)], where sum is over the window
  * (4) iterate over taking steps in the image to minimize the error:
  *     [a] get the subpixel neighborhood in the new image
  *     [b] determine the image difference between the two neighborhoods
  *     [c] calculate the 'b'-vector
  *     [d] calculate the additional flow step and possibly terminate the iteration
  *
  * @param[in] new_img            The image in which the points are searched
  * @param[in] old_img            The image the points were taken from
  * @param[in] points             Points to track, in pixel coordinates
  * @param[in,out] points_cnt     In: number of entries in points. Out: number of entries written to the result
  * @param[in] half_window_size   Half the tracking window size (the patch is 2 * half_window_size wide)
  * @param[in] subpixel_factor    Number of subpixel steps per pixel
  * @param[in] max_iterations     Maximum number of Lucas-Kanade steps per point
  * @param[in] step_threshold     Iteration stops once |step_x| + |step_y| drops below this value
  * @param[in] max_points         Maximum number of points to track (also the size of the returned array)
  * @param[in] keep_bad_points    If non-zero, untrackable points are kept and marked with LARGE_FLOW_ERROR
  * @return Array of max_points flow vectors of which the first *points_cnt are filled in.
  *         The array is allocated here and not freed by this function.
  *         NULL is returned (and *points_cnt set to 0) when the allocation fails.
  */
 struct flow_t *opticFlowLK_flat(struct image_t *new_img, struct image_t *old_img, struct point_t *points, uint16_t *points_cnt,
                                 uint16_t half_window_size, uint16_t subpixel_factor, uint8_t max_iterations, uint8_t step_threshold,
                                 uint16_t max_points, uint8_t keep_bad_points)
 {
   uint16_t new_p = 0;
   uint16_t points_orig = *points_cnt;
   *points_cnt = 0;

   // Allocate zero-initialised memory for returning the vectors
   struct flow_t *vectors = calloc(max_points, sizeof(struct flow_t));
   if (vectors == NULL) {
     return NULL;
   }

   // determine patch sizes and initialize neighborhoods
   uint16_t patch_size = 2 * half_window_size;
   uint32_t error_threshold = (25 * 25) * (patch_size * patch_size);
   uint16_t padded_patch_size = patch_size + 2;

   // Create the window images
   struct image_t window_I, window_J, window_DX, window_DY, window_diff;
   image_create(&window_I, padded_patch_size, padded_patch_size, IMAGE_GRAYSCALE);
   image_create(&window_J, patch_size, patch_size, IMAGE_GRAYSCALE);
   image_create(&window_DX, patch_size, patch_size, IMAGE_GRADIENT);
   image_create(&window_DY, patch_size, patch_size, IMAGE_GRADIENT);
   image_create(&window_diff, patch_size, patch_size, IMAGE_GRADIENT);

   // Calculate the amount of points to skip
   float skip_points = (points_orig > max_points) ? (float)points_orig / max_points : 1;

   // Go through all points
   for (uint16_t i = 0; i < max_points && i < points_orig; i++) {
     uint16_t p = i * skip_points;

     // Convert the point to a subpixel coordinate
     vectors[new_p].pos.x = points[p].x * subpixel_factor;
     vectors[new_p].pos.y = points[p].y * subpixel_factor;

     // Start every point without flow: this slot is reused when the previous point
     // was dropped, and would otherwise still contain the flow of that failed point
     vectors[new_p].flow_x = 0;
     vectors[new_p].flow_y = 0;

     // If the pixel is outside ROI, do not track it.
     // The explicit '> w' / '> h' tests are needed because the subtractions are unsigned
     // and wrap around for points that lie beyond the image.
     if (points[p].x < half_window_size || points[p].x > old_img->w
         || (old_img->w - points[p].x) < half_window_size
         || points[p].y < half_window_size || points[p].y > old_img->h
         || (old_img->h - points[p].y) < half_window_size) {
       if (keep_bad_points) {
         vectors[new_p].error = LARGE_FLOW_ERROR;
         new_p++;
         (*points_cnt)++;
       }
       continue;
     }

     // (1) determine the subpixel neighborhood in the old image
     image_subpixel_window(old_img, &window_I, &vectors[new_p].pos, subpixel_factor, 0);

     // (2) get the x- and y- gradients
     image_gradients(&window_I, &window_DX, &window_DY);

     // (3) determine the 'G'-matrix [sum(Axx) sum(Axy); sum(Axy) sum(Ayy)], where sum is over the window
     int32_t G[4];
     image_calculate_g(&window_DX, &window_DY, G);

     // calculate G's determinant in subpixel units:
     int32_t Det = (G[0] * G[3] - G[1] * G[2]) / subpixel_factor;

     // A determinant below 1 means G cannot be inverted: the point cannot be tracked
     if (Det < 1) {
       if (keep_bad_points) {
         vectors[new_p].error = LARGE_FLOW_ERROR;
         new_p++;
         (*points_cnt)++;
       }
       continue;
     }

     // a * (Ax - Bx) + (1-a) * (Ax+1 - Bx+1)
     // a * Ax - a * Bx + (1-a) * Ax+1 - (1-a) * Bx+1
     // (a * Ax + (1-a) * Ax+1)  - (a * Bx + (1-a) * Bx+1)

     // (4) iterate over taking steps in the image to minimize the error:
     bool tracked = true;
     for (uint8_t it = 0; it < max_iterations; it++) {
       struct point_t new_point =  {
         vectors[new_p].pos.x + vectors[new_p].flow_x,
         vectors[new_p].pos.y + vectors[new_p].flow_y,
         0, 0, 0
       };

       // If the pixel is outside ROI, do not track it
       if (new_point.x / subpixel_factor < half_window_size || (old_img->w - new_point.x / subpixel_factor) <= half_window_size
           || new_point.y / subpixel_factor < half_window_size || (old_img->h - new_point.y / subpixel_factor) <= half_window_size
           || new_point.x / subpixel_factor > old_img->w || new_point.y / subpixel_factor > old_img->h) {
         tracked = false;
         break;
       }

       //     [a] get the subpixel neighborhood in the new image
       image_subpixel_window(new_img, &window_J, &new_point, subpixel_factor, 0);

       //     [b] determine the image difference between the two neighborhoods
       uint32_t error = image_difference(&window_I, &window_J, &window_diff);

       // Give up when the error is still too large in the second half of the iterations
       if (error > error_threshold && it > max_iterations / 2) {
         tracked = false;
         break;
       }

       //     [c] calculate the 'b'-vector
       int32_t b_x = image_multiply(&window_diff, &window_DX, NULL) / 255;
       int32_t b_y = image_multiply(&window_diff, &window_DY, NULL) / 255;

       //     [d] calculate the additional flow step and possibly terminate the iteration
       int16_t step_x = (G[3] * b_x - G[1] * b_y) / Det;
       int16_t step_y = (G[0] * b_y - G[2] * b_x) / Det;
       vectors[new_p].flow_x += step_x;
       vectors[new_p].flow_y += step_y;
       vectors[new_p].error = error;

       // Stop iterating once the step is smaller than the threshold
       if ((abs(step_x) + abs(step_y)) < step_threshold) {
         break;
       }
     }

     // If we tracked the point we update the index and the count
     if (tracked) {
       new_p++;
       (*points_cnt)++;
     } else if (keep_bad_points) {
       vectors[new_p].flow_x = 0;
       vectors[new_p].flow_y = 0;
       vectors[new_p].error = LARGE_FLOW_ERROR;
       new_p++;
       (*points_cnt)++;
     }
   }

   // Free the images
   image_free(&window_I);
   image_free(&window_J);
   image_free(&window_DX);
   image_free(&window_DY);
   image_free(&window_diff);

   // Return the vectors
   return vectors;
 }

uint16_t
unsigned short uint16_t
Definition: types.h:16

image_gradients
void image_gradients(struct image_t *input, struct image_t *dx, struct image_t *dy)
Calculate the gradients using the following matrix: [0 -1 0; -1 0 1; 0 1 0].
Definition: image.c:532

image_difference
uint32_t image_difference(struct image_t *img_a, struct image_t *img_b, struct image_t *diff)
Calculate the difference between two images and return the error. This will only work with grayscale i...
Definition: image.c:588

image_free
void image_free(struct image_t *img)
Free the image.
Definition: image.c:69

LARGE_FLOW_ERROR
#define LARGE_FLOW_ERROR
Definition: lucas_kanade.h:37

flow_t::flow_y
int32_t flow_y
The y direction flow in subpixels.
Definition: image.h:69

image_create
void image_create(struct image_t *img, uint16_t width, uint16_t height, enum image_type type)
Create a new image.
Definition: image.c:43

image_t
Definition: image.h:43

flow_t
Definition: image.h:66

patch_size
uint8_t patch_size
Definition: textons.c:97

int64_t
signed long long int64_t
Definition: types.h:21

point_t::x
uint32_t x
The x coordinate of the point.
Definition: image.h:58

FALSE
#define FALSE
Definition: std.h:5

pyramid_build
void pyramid_build(struct image_t *input, struct image_t *output_array, uint8_t pyr_level, uint16_t border_size)
This function populates given array of image_t structs with wanted number of padded pyramids based on...
Definition: image.c:447

TRUE
#define TRUE
Definition: std.h:4

image_t::w
uint16_t w
Image width.
Definition: image.h:45

uint32_t
unsigned long uint32_t
Definition: types.h:18

image_t::h
uint16_t h
Image height.
Definition: image.h:46

int16_t
signed short int16_t
Definition: types.h:17

flow_t::pos
struct point_t pos
The original position the flow comes from in subpixels.
Definition: image.h:67

point_t::y
uint32_t y
The y coordinate of the point.
Definition: image.h:59

point_t
Definition: image.h:57

int32_t
signed long int32_t
Definition: types.h:19

flow_t::error
uint32_t error
The matching error in the tracking process in subpixels.
Definition: image.h:70

opticFlowLK_flat
struct flow_t * opticFlowLK_flat(struct image_t *new_img, struct image_t *old_img, struct point_t *points, uint16_t *points_cnt, uint16_t half_window_size, uint16_t subpixel_factor, uint8_t max_iterations, uint8_t step_threshold, uint16_t max_points, uint8_t keep_bad_points)
Compute the optical flow of several points using the Lucas-Kanade algorithm by Yves Bouguet The initi...
Definition: lucas_kanade.c:275

uint8_t
unsigned char uint8_t
Definition: types.h:14

lucas_kanade.h
efficient fixed-point optical-flow calculation

p
static float p[2][2]
Definition: ins_alt_float.c:268

IMAGE_GRAYSCALE
Grayscale image with only the Y part (uint8 per pixel)
Definition: image.h:37

image_calculate_g
void image_calculate_g(struct image_t *dx, struct image_t *dy, int32_t *g)
Calculate the G vector of an image gradient. This is used for optical flow calculation.
Definition: image.c:556

int8_t
signed char int8_t
Definition: types.h:15

IMAGE_GRADIENT
An image gradient (int16 per pixel)
Definition: image.h:39

flow_t::flow_x
int32_t flow_x
The x direction flow in subpixels.
Definition: image.h:68

image_multiply
int32_t image_multiply(struct image_t *img_a, struct image_t *img_b, struct image_t *mult)
Calculate the multiplication between two images and return the error This will only work with image g...
Definition: image.c:626

image_subpixel_window
void image_subpixel_window(struct image_t *input, struct image_t *output, struct point_t *center, uint32_t subpixel_factor, uint8_t border_size)
This outputs a subpixel window image in grayscale Currently only works with Grayscale images as input...
Definition: image.c:474

opticFlowLK
struct flow_t * opticFlowLK(struct image_t *new_img, struct image_t *old_img, struct point_t *points, uint16_t *points_cnt, uint16_t half_window_size, uint16_t subpixel_factor, uint8_t max_iterations, uint8_t step_threshold, uint8_t max_points, uint8_t pyramid_level, uint8_t keep_bad_points)
Definition: lucas_kanade.c:74