latest/textons_8c_source.html

/*

 * Copyright (C) 2016, Hann Woei Ho, Guido de Croon

 *

 * This file is part of Paparazzi.

 *

 * Paparazzi is free software; you can redistribute it and/or modify

 * it under the terms of the GNU General Public License as published by

 * the Free Software Foundation; either version 2, or (at your option)

 * any later version.

 *

 * Paparazzi is distributed in the hope that it will be useful,

 * but WITHOUT ANY WARRANTY; without even the implied warranty of

 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

 * GNU General Public License for more details.

 *

 * You should have received a copy of the GNU General Public License

 * along with Paparazzi; see the file COPYING.  If not, write to

 * the Free Software Foundation, 59 Temple Place - Suite 330,

 * Boston, MA 02111-1307, USA.

 */


#include <stdlib.h>

#include <stdio.h>

#include "modules/computer_vision/cv.h"

#include "modules/computer_vision/textons.h"

#include "mcu_periph/sys_time.h"

#include "generated/airframe.h"


// The texton dictionary, indexed as dictionary[texton][row][column][channel].
// Channel 0 holds the first byte of a pixel (U/V) and channel 1 the second
// byte (Y), as filled in by DictionaryTrainingYUV(). Allocated in textons_init().
float ** **dictionary;

// Number of patches learned so far; incremented once per sampled patch in
// DictionaryTrainingYUV() and reset whenever a learning round (re)starts.
uint32_t learned_samples = 0;

// Set to 1 once the textons have been seeded with random image patches.
uint8_t dictionary_initialized = 0;

// Histogram of texton assignments, normalised by the number of extracted
// patches in DistributionExtraction(). Allocated in textons_init().
float *texton_distribution;


// Number of dictionary entries and histogram bins allocated in textons_init().
#define MAX_N_TEXTONS 255


// initial settings:
// Each macro below can be overridden at build time; the values given here are
// only used when the macro is not already defined. They seed the run-time
// variables declared further down in this file.

// Initial value of `running`: texton_func() does nothing while it is zero.
#ifndef TEXTONS_RUN
#define TEXTONS_RUN 1
#endif
PRINT_CONFIG_VAR(TEXTONS_RUN)

// Frame rate passed to cv_add_to_device() in textons_init().
#ifndef TEXTONS_FPS
#define TEXTONS_FPS 30
#endif
PRINT_CONFIG_VAR(TEXTONS_FPS)

// Initial value of `load_dictionary`: non-zero loads the dictionary from file
// instead of learning it.
#ifndef TEXTONS_LOAD_DICTIONARY
#define TEXTONS_LOAD_DICTIONARY 1
#endif
PRINT_CONFIG_VAR(TEXTONS_LOAD_DICTIONARY)

// Initial value of `reinitialize_dictionary`: non-zero triggers a fresh
// initialisation and learning phase on the next frame.
#ifndef TEXTONS_REINITIALIZE_DICTIONARY
#define TEXTONS_REINITIALIZE_DICTIONARY 0
#endif
PRINT_CONFIG_VAR(TEXTONS_REINITIALIZE_DICTIONARY)

// Initial value of `alpha_uint`; the learning rate is alpha_uint / 255.
#ifndef TEXTONS_ALPHA
#define TEXTONS_ALPHA 0
#endif
PRINT_CONFIG_VAR(TEXTONS_ALPHA)

// Initial value of `n_textons`, the number of dictionary entries in use.
#ifndef TEXTONS_N_TEXTONS
#define TEXTONS_N_TEXTONS 20
#endif
PRINT_CONFIG_VAR(TEXTONS_N_TEXTONS)

// Initial value of `n_samples_image`, the number of patches sampled per image.
#ifndef TEXTONS_N_SAMPLES
#define TEXTONS_N_SAMPLES 250
#endif
PRINT_CONFIG_VAR(TEXTONS_N_SAMPLES)

// Initial value of `patch_size` (side length of a patch in pixels).
// texton_func() increments odd values to the next even value.
#ifndef TEXTONS_PATCH_SIZE
#define TEXTONS_PATCH_SIZE 6
#endif
PRINT_CONFIG_VAR(TEXTONS_PATCH_SIZE)

// Initial value of `n_learning_samples`: number of learned patches after which
// the dictionary is saved.
#ifndef TEXTONS_N_LEARNING_SAMPLES
#define TEXTONS_N_LEARNING_SAMPLES 5000
#endif
PRINT_CONFIG_VAR(TEXTONS_N_LEARNING_SAMPLES)

// Initial value of `FULL_SAMPLING`: non-zero makes DistributionExtraction()
// step over the image instead of drawing random patches.
#ifndef TEXTONS_FULL_SAMPLING
#define TEXTONS_FULL_SAMPLING 0
#endif
PRINT_CONFIG_VAR(TEXTONS_FULL_SAMPLING)

// Initial value of `border_width`: horizontal margin left out of the random
// sampling in DistributionExtraction().
#ifndef TEXTONS_BORDER_WIDTH
#define TEXTONS_BORDER_WIDTH 0
#endif
PRINT_CONFIG_VAR(TEXTONS_BORDER_WIDTH)

// Initial value of `border_height`: vertical margin left out of the random
// sampling in DistributionExtraction().
#ifndef TEXTONS_BORDER_HEIGHT
#define TEXTONS_BORDER_HEIGHT 0
#endif
PRINT_CONFIG_VAR(TEXTONS_BORDER_HEIGHT)

// Initial value of `dictionary_number`, which is part of the dictionary file
// name (Dictionary_<number>.dat).
#ifndef TEXTONS_DICTIONARY_NUMBER
#define TEXTONS_DICTIONARY_NUMBER 0
#endif
PRINT_CONFIG_VAR(TEXTONS_DICTIONARY_NUMBER)

// Directory of the dictionary files. Deliberately not quoted: the save/load
// functions turn it into a string with STRINGIFY().
#ifndef TEXTONS_DICTIONARY_PATH
#define TEXTONS_DICTIONARY_PATH /data/ftp/internal_000
#endif


// Handle returned by cv_add_to_device() when texton_func() is registered.
struct video_listener *listener = NULL;

// Run-time settings, seeded from the TEXTONS_* configuration macros:
uint8_t running = TEXTONS_RUN;                                     // texton_func() returns immediately while zero
uint8_t load_dictionary = TEXTONS_LOAD_DICTIONARY;                 // non-zero: load the dictionary from file instead of learning
uint8_t reinitialize_dictionary = TEXTONS_REINITIALIZE_DICTIONARY; // one-shot trigger, cleared again by texton_func()
uint8_t alpha_uint = TEXTONS_ALPHA;                                // learning rate numerator: alpha = alpha_uint / 255
uint8_t n_textons = TEXTONS_N_TEXTONS;                             // number of textons in use
uint8_t patch_size = TEXTONS_PATCH_SIZE;                           // patch side length in pixels, made even by texton_func()
uint32_t n_learning_samples = TEXTONS_N_LEARNING_SAMPLES;          // learned patches after which the dictionary is saved
uint32_t n_samples_image = TEXTONS_N_SAMPLES;                      // patches sampled per image
uint8_t FULL_SAMPLING = TEXTONS_FULL_SAMPLING;                     // non-zero: step over the image instead of random sampling
uint32_t border_width = TEXTONS_BORDER_WIDTH;                      // horizontal margin excluded from random sampling
uint32_t border_height = TEXTONS_BORDER_HEIGHT;                    // vertical margin excluded from random sampling
uint8_t dictionary_number = TEXTONS_DICTIONARY_NUMBER;             // number used in the dictionary file name

// status variables
uint8_t dictionary_ready = 0; // set to 1 once a dictionary has been learned or loaded
float alpha = 0.0;            // learning rate, derived from alpha_uint in DictionaryTrainingYUV()

// File pointer used for both saving and loading the dictionary
static FILE *dictionary_logger = NULL;

// Video callback, registered with cv_add_to_device() in textons_init().
struct image_t *texton_func(struct image_t *img, UNUSED uint8_t p);


/**
 * Video callback of the textons module (registered in textons_init()).
 *
 * Per frame, exactly one of the following happens:
 *  - no dictionary yet, load_dictionary set:   load it from file;
 *  - no dictionary yet, load_dictionary clear: train on the frame and, once
 *    n_learning_samples patches were learned, save the dictionary and mark it
 *    ready;
 *  - dictionary ready, alpha_uint > 0: keep training and save the dictionary
 *    every n_learning_samples patches;
 *  - dictionary ready, alpha_uint == 0: extract the texton histogram of the
 *    frame into texton_distribution.
 *
 * @param img Incoming frame; its buffer is handed on as raw bytes.
 * @param p   Unused.
 * @return    Always the unmodified input image.
 */
struct image_t *texton_func(struct image_t *img, UNUSED uint8_t p)
{
  // whether to execute the function:
  if (!running) { return img; }

  // nothing to do without pixel data
  if (img->buf_size == 0 || img->buf == NULL) { return img; }

  // the dictionary and the histogram must have been allocated before any
  // of the routines below may touch them
  if (dictionary == NULL || texton_distribution == NULL) { return img; }

  // extract frame from img struct:
  uint8_t *frame = (uint8_t *)img->buf;

  // if patch size odd, correct:
  if (patch_size % 2 == 1) { patch_size++; }

  // check whether we have to reinitialize the dictionary:
  if (reinitialize_dictionary) {
    // set all vars to trigger a reinitialization and learning phase of the dictionary:
    dictionary_ready = 0;
    dictionary_initialized = 0;
    load_dictionary = 0;
    learned_samples = 0;
    alpha_uint = 10;
    // the trigger is one-shot
    reinitialize_dictionary = 0;
  }

  if (dictionary_ready == 0) {
    if (load_dictionary == 0) {
      // uint32_t is not guaranteed to be `int`, so convert explicitly for printf
      printf("Learned samples: %lu / %lu\n",
             (unsigned long) learned_samples, (unsigned long) n_learning_samples);

      // Train the dictionary:
      DictionaryTrainingYUV(frame, img->w, img->h);

      // After a number of samples, stop learning:
      if (learned_samples >= n_learning_samples) {
        // Save the dictionary:
        save_texton_dictionary();
        // stop learning:
        dictionary_ready = 1;
        // lower learning rate
        alpha = 0.0;
        printf("Enough learning!\n");
        alpha_uint = 0;
        // set learned samples back to 0
        learned_samples = 0;
      }
    } else {
      // Load the dictionary; on failure this switches to learning mode,
      // which then starts with the next frame:
      load_texton_dictionary();
    }
  } else {
    if (alpha_uint > 0) {
      // A non-zero learning rate means the dictionary keeps adapting online.
      DictionaryTrainingYUV(frame, img->w, img->h);

      if (learned_samples >= n_learning_samples) {
        // Save the dictionary:
        save_texton_dictionary();
        // reset learned_samples:
        learned_samples = 0;
      }
    } else {
      // Extract distributions
      DistributionExtraction(frame, img->w, img->h);
    }
  }

  return img; // the image itself is never modified
}

struct image_t *texton_func(struct image_t *img, UNUSED uint8_t p) {…}


/**
 * Perform one pass of dictionary training on a frame.
 *
 * On the first call after a (re)initialisation the textons are seeded with
 * random patches of the frame. On every later call n_samples_image random
 * patches are drawn; each patch is assigned to the texton with the smallest
 * squared Euclidean distance, and that texton is moved towards the patch with
 * learning rate alpha = alpha_uint / 255. learned_samples is incremented once
 * per patch.
 *
 * The call is a no-op when the frame or dictionary is missing, when
 * n_textons or patch_size is zero, or when the image is not larger than a
 * patch in both dimensions.
 *
 * @param frame  Raw image bytes, read as two bytes per pixel.
 * @param width  Image width in pixels.
 * @param height Image height in pixels.
 */
void DictionaryTrainingYUV(uint8_t *frame, uint16_t width, uint16_t height)
{
  // Refuse configurations that would give a modulo by zero below or make the
  // sampling read outside of the frame.
  if (frame == NULL || dictionary == NULL || n_textons == 0 || patch_size == 0
      || width <= patch_size || height <= patch_size) {
    return;
  }

  const int range_x = width - patch_size;       // number of valid patch columns
  const int range_y = height - patch_size;      // number of valid patch rows
  const size_t row_stride = (size_t) width * 2; // bytes per image row

  // ***********************
  //   DICTIONARY LEARNING
  // ***********************

  if (!dictionary_initialized) {
    // **************
    // INITIALISATION
    // **************

    printf("Intializing dictionary!\n");

    // in the first image, we initialize the textons to random patches in the image
    for (int w = 0; w < n_textons; w++) {
      // select a coordinate
      const int x = rand() % range_x;
      const int y = rand() % range_y;

      // take the sample
      for (int i = 0; i < patch_size; i++) {
        const uint8_t *buf = frame + row_stride * (size_t)(i + y) + (size_t)(2 * x);
        for (int j = 0; j < patch_size; j++) {
          // NOTE(review): these two prints run once per pixel of every texton
          // and look like leftover debug output; kept to preserve the output.
          printf("Setting dictionary:\n");
          // U/V component
          dictionary[w][i][j][0] = (float) *buf++;
          // Y1/Y2 component
          dictionary[w][i][j][1] = (float) *buf++;
          printf("Done!\n");
        }
      }
    }
    dictionary_initialized = 1;
    return;
  }

  // ********
  // LEARNING
  // ********
  printf("Learning!");
  alpha = ((float) alpha_uint) / 255.0;

  // One contiguous buffer for the patch, laid out as [row][column][channel].
  const size_t patch_len = (size_t) patch_size * patch_size * 2;
  float *patch = calloc(patch_len, sizeof *patch);
  if (patch == NULL) {
    printf("Textons: out of memory, skipping training pass\n");
    return;
  }

  // Extract and learn from n_samples_image per image
  for (int s = 0; s < (int) n_samples_image; s++) {
    // select a random sample from the image
    const int x = rand() % range_x;
    const int y = rand() % range_y;

    // extract sample
    float *cell = patch;
    for (int i = 0; i < patch_size; i++) {
      const uint8_t *buf = frame + row_stride * (size_t)(i + y) + (size_t)(2 * x);
      for (int j = 0; j < patch_size; j++) {
        *cell++ = (float) *buf++; // U/V component
        *cell++ = (float) *buf++; // Y1/Y2 component
      }
    }

    // search the closest texton (ties go to the lowest index)
    int assignment = 0;
    float min_dist = 0.0f;
    for (int texton = 0; texton < n_textons; texton++) {
      float dist = 0.0f;
      const float *value = patch;
      for (int i = 0; i < patch_size; i++) {
        for (int j = 0; j < patch_size; j++) {
          for (int c = 0; c < 2; c++) {
            const float diff = *value++ - dictionary[texton][i][j][c];
            dist += diff * diff;
          }
        }
      }
      if (texton == 0 || dist < min_dist) {
        min_dist = dist;
        assignment = texton;
      }
    }

    // move the neighbour closer to the input
    const float *value = patch;
    for (int i = 0; i < patch_size; i++) {
      for (int j = 0; j < patch_size; j++) {
        for (int c = 0; c < 2; c++) {
          const float error_texton = *value++ - dictionary[assignment][i][j][c];
          dictionary[assignment][i][j][c] += (alpha * error_texton);
        }
      }
    }

    // Augment the number of learned samples:
    learned_samples++;
  }

  free(patch);
}

void DictionaryTrainingYUV(uint8_t *frame, uint16_t width, uint16_t height) {…}


/**
 * Extract the texton histogram of a frame into texton_distribution.
 *
 * Patches are compared with every texton of the dictionary (squared Euclidean
 * distance) and the bin of the closest texton is incremented. Afterwards the
 * first n_textons bins are divided by the number of extracted patches.
 *
 * Sampling modes:
 *  - FULL_SAMPLING == 0: n_samples_image patches (at least one) are drawn at
 *    random positions that respect border_width / border_height;
 *  - FULL_SAMPLING != 0: the image is traversed on a grid, with steps of
 *    patch_size in y and steps of one pixel in x; the borders are not applied.
 *
 * The call is a no-op (histogram left untouched) when a required buffer is
 * missing, when n_textons or patch_size is zero, or when no patch fits into
 * the sampling area.
 *
 * @param frame  Raw image bytes, read as two bytes per pixel.
 * @param width  Image width in pixels.
 * @param height Image height in pixels.
 */
void DistributionExtraction(uint8_t *frame, uint16_t width, uint16_t height)
{
  if (frame == NULL || dictionary == NULL || texton_distribution == NULL
      || n_textons == 0 || patch_size == 0
      || width < patch_size || height < patch_size) {
    return;
  }

  // Read the mode once so that it cannot change halfway through the frame.
  const uint8_t full_sampling = FULL_SAMPLING;

  // Size of the area random patch origins are drawn from. Computed in a wide
  // signed type because the borders are unsigned 32 bit settings.
  const long long range_x = (long long) width - patch_size - 2 * (long long) border_width;
  const long long range_y = (long long) height - patch_size - 2 * (long long) border_height;
  if (!full_sampling && (range_x <= 0 || range_y <= 0)) {
    return;
  }

  // One contiguous buffer for the patch, laid out as [row][column][channel].
  const size_t patch_len = (size_t) patch_size * patch_size * 2;
  float *patch = calloc(patch_len, sizeof *patch);
  if (patch == NULL) {
    printf("Textons: out of memory, skipping distribution extraction\n");
    return;
  }

  // Start from an empty histogram; otherwise the normalised result of the
  // previous frame would be counted again.
  for (int i = 0; i < n_textons; i++) {
    texton_distribution[i] = 0.0f;
  }

  const size_t row_stride = (size_t) width * 2; // bytes per image row
  int n_extracted_textons = 0;
  int finished = 0;
  int x = 0;
  int y = 0;

  while (!finished) {
    if (!full_sampling) {
      x = (int) border_width + rand() % (int) range_x;
      y = (int) border_height + rand() % (int) range_y;
    }

    // extract sample
    float *cell = patch;
    for (int i = 0; i < patch_size; i++) {
      const uint8_t *buf = frame + row_stride * (size_t)(i + y) + (size_t)(2 * x);
      for (int j = 0; j < patch_size; j++) {
        *cell++ = (float) *buf++; // U/V component
        *cell++ = (float) *buf++; // Y1/Y2 component
      }
    }

    // determine the nearest neighbour (ties go to the lowest index)
    int assignment = 0;
    float min_dist = 0.0f;
    for (int texton = 0; texton < n_textons; texton++) {
      float dist = 0.0f;
      const float *value = patch;
      for (int i = 0; i < patch_size; i++) {
        for (int j = 0; j < patch_size; j++) {
          for (int c = 0; c < 2; c++) {
            const float diff = *value++ - dictionary[texton][i][j][c];
            dist += diff * diff;
          }
        }
      }
      if (texton == 0 || dist < min_dist) {
        min_dist = dist;
        assignment = texton;
      }
    }

    // put the assignment in the histogram
    texton_distribution[assignment] += 1.0f;
    n_extracted_textons++;

    if (!full_sampling) {
      // Random sampling ends on the sample count only; the grid bookkeeping
      // below must not run here, or a patch near the bottom-right corner
      // would end the loop early.
      finished = ((uint32_t) n_extracted_textons >= n_samples_image);
    } else {
      // FULL_SAMPLING is actually a sampling that covers the image:
      y += patch_size;
      // True full sampling would require:
      // y++;

      if (y > height - patch_size) {
        x++;
        y = 0;
      }
      if (x > width - patch_size) {
        finished = 1;
      }
    }
  }

  // Normalize distribution (at least one patch was extracted above):
  for (int i = 0; i < n_textons; i++) {
    texton_distribution[i] = texton_distribution[i] / (float) n_extracted_textons;
  }

  free(patch);
}

void DistributionExtraction(uint8_t *frame, uint16_t width, uint16_t height) {…}


/**
 * Save the texton dictionary to
 * <TEXTONS_DICTIONARY_PATH>/Dictionary_<dictionary_number>.dat.
 *
 * The file is (over-)written as text with one value per line, in the order
 * texton, row, column, channel. Only the first n_textons entries and
 * patch_size x patch_size values per channel are written. Failures are
 * reported on stdout / stderr; nothing is returned.
 */
void save_texton_dictionary(void)
{
  char filename[512];

  if (dictionary == NULL) {
    return; // nothing to save
  }

  // Build the file name without risking a buffer overrun.
  const int len = snprintf(filename, sizeof(filename), "%s/Dictionary_%05d.dat",
                           STRINGIFY(TEXTONS_DICTIONARY_PATH), dictionary_number);
  if (len < 0 || (size_t) len >= sizeof(filename)) {
    printf("Texton dictionary path is too long, dictionary not saved.\n");
    return;
  }

  dictionary_logger = fopen(filename, "w");
  if (dictionary_logger == NULL) {
    printf("Filename: %s\n", filename);
    perror("Error while opening the file.\n");
    return;
  }

  // (over-)write dictionary
  int write_failed = 0;
  for (int i = 0; i < n_textons; i++) {
    for (int j = 0; j < patch_size; j++) {
      for (int k = 0; k < patch_size; k++) {
        if (fprintf(dictionary_logger, "%f\n", dictionary[i][j][k][0]) < 0) { write_failed = 1; }
        if (fprintf(dictionary_logger, "%f\n", dictionary[i][j][k][1]) < 0) { write_failed = 1; }
      }
    }
  }

  // fclose() flushes, so a full disk may only show up here.
  if (fclose(dictionary_logger) != 0) {
    write_failed = 1;
  }
  dictionary_logger = NULL; // do not keep a handle to a closed stream around

  if (write_failed) {
    printf("Error while writing texton dictionary %s\n", filename);
  }
}

void save_texton_dictionary(void) {…}


/**
 * Load the texton dictionary from
 * <TEXTONS_DICTIONARY_PATH>/Dictionary_<dictionary_number>.dat.
 *
 * The file is expected to hold one value per line in the order texton, row,
 * column, channel, for n_textons textons of patch_size x patch_size pixels.
 *
 * - File opened: values are read until all were read or the first value
 *   cannot be parsed; entries that were not read keep their current content.
 *   dictionary_ready is set in both cases, and a short file is reported.
 * - File cannot be opened: the module is switched to learning a new
 *   dictionary (load_dictionary, learned_samples and dictionary_initialized
 *   are cleared).
 */
void load_texton_dictionary(void)
{
  char filename[512];

  if (dictionary == NULL) {
    return; // nothing to load into
  }

  // Build the file name without risking a buffer overrun; an over-long name
  // is handled like a file that cannot be opened.
  const int len = snprintf(filename, sizeof(filename), "%s/Dictionary_%05d.dat",
                           STRINGIFY(TEXTONS_DICTIONARY_PATH), dictionary_number);
  dictionary_logger = NULL;
  if (len >= 0 && (size_t) len < sizeof(filename)) {
    dictionary_logger = fopen(filename, "r");
  }

  if (dictionary_logger == NULL) {
    // If the given dictionary does not exist, we start learning one:
    printf("Texton dictionary %d does not exist, we start learning one.\n", dictionary_number);
    load_dictionary = 0;
    learned_samples = 0;
    dictionary_initialized = 0;
    return;
  }

  // Load the dictionary. A single flag ends all loops at the first value that
  // cannot be read, be it end of file or malformed input.
  const int n_expected = n_textons * patch_size * patch_size * 2;
  int n_read = 0;
  int complete = 1;
  for (int i = 0; complete && i < n_textons; i++) {
    for (int j = 0; complete && j < patch_size; j++) {
      for (int k = 0; complete && k < patch_size; k++) {
        for (int c = 0; c < 2; c++) {
          if (fscanf(dictionary_logger, "%f\n", &dictionary[i][j][k][c]) != 1) {
            complete = 0;
            break;
          }
          n_read++;
        }
      }
    }
  }

  fclose(dictionary_logger);
  dictionary_logger = NULL; // do not keep a handle to a closed stream around

  if (!complete) {
    printf("Texton dictionary %d is incomplete: read %d of %d values.\n",
           dictionary_number, n_read, n_expected);
  }

  // The dictionary is used as loaded, also when the file was short.
  dictionary_ready = 1;
}

void load_texton_dictionary(void) {…}


void textons_init(void)

{

  printf("Textons init\n");

  texton_distribution = (float *)calloc(MAX_N_TEXTONS, sizeof(float));

  dictionary_initialized = 0;

  learned_samples = 0;

  dictionary_ready = 0;

  dictionary = (float ** **)calloc(MAX_N_TEXTONS, sizeof(float ** *));

  for (int w = 0; w < MAX_N_TEXTONS; w++) {

    dictionary[w] = (float ** *) calloc(patch_size, sizeof(float **));

    for (int i = 0; i < patch_size; i++) {

      dictionary[w][i] = (float **) calloc(patch_size, sizeof(float *));

      for (int j = 0; j < patch_size; j++) {

        dictionary[w][i][j] = (float *) calloc(2, sizeof(float));

      }

    }

  }


  listener = cv_add_to_device(&TEXTONS_CAMERA, texton_func, TEXTONS_FPS, 0);

}

void textons_init(void) {…}


void textons_stop(void)

{

  free(texton_distribution);

  free(dictionary);

}

void textons_stop(void) {…}


float get_entropy(float *p_dist, int D)

{

  float entropy = 0.0f;

  int i;

  for (i = 0; i < D; i++) {

    if (p_dist[i] > 0) {

      entropy -= p_dist[i] * log2(p_dist[i]);

    }

  }


  return entropy;

}

float get_entropy(float *p_dist, int D) {…}

frame
static uint8_t frame[20]
Definition cc2500_frsky_x.c:163

UNUSED
#define UNUSED(x)
Definition cc2500_frsky_x.c:12

cv_add_to_device
struct video_listener * cv_add_to_device(struct video_config_t *device, cv_function func, uint16_t fps, uint8_t id)
Definition cv.c:46

cv.h
Computer vision framework for onboard processing.

video_listener
Definition cv.h:51

image_t::buf
void * buf
Image buffer (depending on the image_type)
Definition image.h:54

image_t::w
uint16_t w
Image width.
Definition image.h:46

image_t
Definition image.h:44

p
static float p[2][2]
Definition ins_alt_float.c:273

s
static uint32_t s
Definition light_scheduler.c:33

foo
uint16_t foo
Definition main_demo5.c:58

PRINT_CONFIG_VAR
PRINT_CONFIG_VAR(ONELOOP_ANDI_FILT_CUTOFF)

sys_time.h
Architecture independent timing functions.

save_texton_dictionary
void save_texton_dictionary(void)
Save the texton dictionary.
Definition textons.c:501

listener
struct video_listener * listener
Definition textons.c:116

load_texton_dictionary
void load_texton_dictionary(void)
Load a texton dictionary.
Definition textons.c:532

TEXTONS_FPS
#define TEXTONS_FPS
Definition textons.c:53

texton_distribution
float * texton_distribution
Definition textons.c:42

TEXTONS_ALPHA
#define TEXTONS_ALPHA
Definition textons.c:68

TEXTONS_PATCH_SIZE
#define TEXTONS_PATCH_SIZE
Definition textons.c:83

patch_size
uint8_t patch_size
Definition textons.c:123

n_learning_samples
uint32_t n_learning_samples
Definition textons.c:124

load_dictionary
uint8_t load_dictionary
Definition textons.c:119

n_textons
uint8_t n_textons
Definition textons.c:122

TEXTONS_DICTIONARY_NUMBER
#define TEXTONS_DICTIONARY_NUMBER
Definition textons.c:108

FULL_SAMPLING
uint8_t FULL_SAMPLING
Definition textons.c:126

TEXTONS_N_TEXTONS
#define TEXTONS_N_TEXTONS
Definition textons.c:73

DictionaryTrainingYUV
void DictionaryTrainingYUV(uint8_t *frame, uint16_t width, uint16_t height)
Function that performs one pass for dictionary training.
Definition textons.c:227

dictionary_ready
uint8_t dictionary_ready
Definition textons.c:132

dictionary_logger
static FILE * dictionary_logger
Definition textons.c:136

n_samples_image
uint32_t n_samples_image
Definition textons.c:125

learned_samples
uint32_t learned_samples
Definition textons.c:40

get_entropy
float get_entropy(float *p_dist, int D)
Function that calculates a base-2 Shannon entropy for a probability distribution.
Definition textons.c:594

TEXTONS_DICTIONARY_PATH
#define TEXTONS_DICTIONARY_PATH
Definition textons.c:113

dictionary_initialized
uint8_t dictionary_initialized
Definition textons.c:41

dictionary
float **** dictionary
Definition textons.c:39

alpha_uint
uint8_t alpha_uint
Definition textons.c:121

MAX_N_TEXTONS
#define MAX_N_TEXTONS
Definition textons.c:44

TEXTONS_LOAD_DICTIONARY
#define TEXTONS_LOAD_DICTIONARY
Definition textons.c:58

reinitialize_dictionary
uint8_t reinitialize_dictionary
Definition textons.c:120

alpha
float alpha
Definition textons.c:133

TEXTONS_BORDER_HEIGHT
#define TEXTONS_BORDER_HEIGHT
Definition textons.c:103

textons_stop
void textons_stop(void)
Definition textons.c:583

textons_init
void textons_init(void)
Initialize.
Definition textons.c:562

DistributionExtraction
void DistributionExtraction(uint8_t *frame, uint16_t width, uint16_t height)
Function that extracts a texton histogram from an image.
Definition textons.c:372

border_width
uint32_t border_width
Definition textons.c:127

border_height
uint32_t border_height
Definition textons.c:128

TEXTONS_N_LEARNING_SAMPLES
#define TEXTONS_N_LEARNING_SAMPLES
Definition textons.c:88

TEXTONS_BORDER_WIDTH
#define TEXTONS_BORDER_WIDTH
Definition textons.c:98

dictionary_number
uint8_t dictionary_number
Definition textons.c:129

TEXTONS_RUN
#define TEXTONS_RUN
Definition textons.c:48

TEXTONS_N_SAMPLES
#define TEXTONS_N_SAMPLES
Definition textons.c:78

TEXTONS_REINITIALIZE_DICTIONARY
#define TEXTONS_REINITIALIZE_DICTIONARY
Definition textons.c:63

texton_func
struct image_t * texton_func(struct image_t *img, UNUSED uint8_t p)
Main texton processing function that first either loads or learns a dictionary and then extracts the ...
Definition textons.c:144

running
uint8_t running
Definition textons.c:118

TEXTONS_FULL_SAMPLING
#define TEXTONS_FULL_SAMPLING
Definition textons.c:93

textons.h
Takes an image and represents the texture and colors in the image with a texton histogram.

D
static float D
Definition trilateration.c:35

uint16_t
unsigned short uint16_t
Typedef defining 16 bit unsigned short type.
Definition vl53l1_types.h:88

uint32_t
unsigned int uint32_t
Typedef defining 32 bit unsigned int type.
Definition vl53l1_types.h:78

uint8_t
unsigned char uint8_t
Typedef defining 8 bit unsigned char type.
Definition vl53l1_types.h:98