v5.14/textons_8c_source.html

 /*

  * Copyright (C) 2016, Hann Woei Ho, Guido de Croon

  *

  * This file is part of Paparazzi.

  *

  * Paparazzi is free software; you can redistribute it and/or modify

  * it under the terms of the GNU General Public License as published by

  * the Free Software Foundation; either version 2, or (at your option)

  * any later version.

  *

  * Paparazzi is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

  * GNU General Public License for more details.

  *

  * You should have received a copy of the GNU General Public License

  * along with Paparazzi; see the file COPYING.  If not, write to

  * the Free Software Foundation, 59 Temple Place - Suite 330,

  * Boston, MA 02111-1307, USA.

  */


 #include <stdlib.h>

 #include <stdio.h>

 #include "modules/computer_vision/cv.h"

 #include "modules/computer_vision/textons.h"


 // Texton dictionary, indexed as dictionary[texton][row][column][channel].
 // Allocated in textons_init() with n_textons x patch_size x patch_size x 2 floats.
 float ** **dictionary;

 // Number of image patches used for learning so far (incremented per learned patch).
 uint32_t learned_samples = 0;

 // Non-zero once the textons have been seeded with patches from a first image.
 uint8_t dictionary_initialized = 0;

 // Texton histogram with n_textons entries, filled by DistributionExtraction().
 float *texton_distribution;


 // Initial settings: each macro is only defined here when it has not been
 // defined already, and initializes the matching run-time variable below.

 // Non-zero: load the dictionary from file; zero: learn a new dictionary.
 #ifndef TEXTONS_LOAD_DICTIONARY

 #define TEXTONS_LOAD_DICTIONARY 1

 #endif

 PRINT_CONFIG_VAR(TEXTONS_LOAD_DICTIONARY)


 // Learning rate numerator: the rate used while training is TEXTONS_ALPHA / 255.
 #ifndef TEXTONS_ALPHA

 #define TEXTONS_ALPHA 10

 #endif

 PRINT_CONFIG_VAR(TEXTONS_ALPHA)


 // Number of textons (entries) in the dictionary.
 #ifndef TEXTONS_N_TEXTONS

 #define TEXTONS_N_TEXTONS 20

 #endif

 PRINT_CONFIG_VAR(TEXTONS_N_TEXTONS)


 // Number of patches sampled per image.
 #ifndef TEXTONS_N_SAMPLES

 #define TEXTONS_N_SAMPLES 100

 #endif

 PRINT_CONFIG_VAR(TEXTONS_N_SAMPLES)


 // Patch side length in pixels; texton_func() rounds odd values up by one.
 #ifndef TEXTONS_PATCH_SIZE

 #define TEXTONS_PATCH_SIZE 6

 #endif

 PRINT_CONFIG_VAR(TEXTONS_PATCH_SIZE)


 // Learning stops once at least this many patches have been learned.
 #ifndef TEXTONS_N_LEARNING_SAMPLES

 #define TEXTONS_N_LEARNING_SAMPLES 10000

 #endif

 PRINT_CONFIG_VAR(TEXTONS_N_LEARNING_SAMPLES)


 // Non-zero: step over the image when extracting the histogram instead of
 // drawing random patch positions.
 #ifndef TEXTONS_FULL_SAMPLING

 #define TEXTONS_FULL_SAMPLING 0

 #endif

 PRINT_CONFIG_VAR(TEXTONS_FULL_SAMPLING)


 // Horizontal margin excluded from random patch positions during extraction.
 #ifndef TEXTONS_BORDER_WIDTH

 #define TEXTONS_BORDER_WIDTH 0

 #endif

 PRINT_CONFIG_VAR(TEXTONS_BORDER_WIDTH)


 // Vertical margin excluded from random patch positions during extraction.
 #ifndef TEXTONS_BORDER_HEIGHT

 #define TEXTONS_BORDER_HEIGHT 0

 #endif

 PRINT_CONFIG_VAR(TEXTONS_BORDER_HEIGHT)


 // Number used in the dictionary file name (Dictionary_<number>.dat).
 #ifndef TEXTONS_DICTIONARY_NUMBER

 #define TEXTONS_DICTIONARY_NUMBER 0

 #endif

 PRINT_CONFIG_VAR(TEXTONS_DICTIONARY_NUMBER)


 // Run-time settings, initialized from the TEXTONS_* defaults above.

 // Non-zero: load the dictionary from file; cleared when the file cannot be opened.
 uint8_t load_dictionary = TEXTONS_LOAD_DICTIONARY;

 // Learning rate as an 8-bit value; training uses alpha = alpha_uint / 255.
 uint8_t alpha_uint = TEXTONS_ALPHA;

 // Number of textons in the dictionary and bins in texton_distribution.
 uint8_t n_textons = TEXTONS_N_TEXTONS;

 // Patch side length in pixels (texton_func() rounds odd values up by one).
 uint8_t patch_size = TEXTONS_PATCH_SIZE;

 // Learning is finished once learned_samples reaches this value.
 uint32_t n_learning_samples = TEXTONS_N_LEARNING_SAMPLES;

 // Number of patches sampled per image.
 uint32_t n_samples_image = TEXTONS_N_SAMPLES;

 // Non-zero: step over the image during extraction instead of random sampling.
 uint8_t FULL_SAMPLING = TEXTONS_FULL_SAMPLING;

 // Horizontal margin kept free of random patch positions during extraction.
 uint32_t border_width = TEXTONS_BORDER_WIDTH;

 // Vertical margin kept free of random patch positions during extraction.
 uint32_t border_height = TEXTONS_BORDER_HEIGHT;

 // Number used in the dictionary file name.
 uint8_t dictionary_number = TEXTONS_DICTIONARY_NUMBER;


 // status variables

 // Non-zero once a dictionary has been loaded or learned; texton_func() then
 // extracts distributions instead of loading/training.
 uint8_t dictionary_ready = 0;

 // Learning rate used when moving a texton towards a patch; reset to 0 when
 // learning stops.
 float alpha = 0.0;


 // File handle used for both saving and loading the dictionary

 static FILE *dictionary_logger = NULL;

 // Directory of the dictionary files; given unquoted and turned into a string
 // with STRINGIFY() where the file name is built.
 #ifndef DICTIONARY_PATH

 #define DICTIONARY_PATH /data/video/

 #endif


 struct image_t *texton_func(struct image_t *img);

 /**
  * Per-frame entry point of the texton module.
  *
  * As long as no dictionary is ready, the frame is either used to train the
  * dictionary (load_dictionary == 0) or a stored dictionary is loaded from
  * file. Once the dictionary is ready, the texton distribution of the frame
  * is extracted instead.
  *
  * @param img  incoming image; its buffer is read as bytes, never replaced
  * @return the same image pointer that was passed in
  */
 struct image_t *texton_func(struct image_t *img)
 {
   // An empty buffer holds nothing to sample from
   if (img->buf_size == 0) {
     return img;
   }

   uint8_t *frame = (uint8_t *)img->buf;

   // Only even patch sizes are used: bump an odd size up by one
   if (patch_size % 2 == 1) {
     patch_size++;
   }

   // Dictionary available: extract the distribution of this frame
   if (dictionary_ready != 0) {
     DistributionExtraction(frame, img->w, img->h);
     return img;
   }

   // No dictionary yet, and one should be loaded from file
   if (load_dictionary != 0) {
     load_texton_dictionary();
     return img;
   }

   // No dictionary yet, and it has to be learned: one training pass per frame
   DictionaryTrainingYUV(frame, img->w, img->h);

   if (learned_samples >= n_learning_samples) {
     // Enough samples seen: store the result and stop learning
     save_texton_dictionary();
     dictionary_ready = 1;
     alpha = 0.0;
   }

   return img;
 }


 void DictionaryTrainingYUV(uint8_t *frame, uint16_t width, uint16_t height)

 {

   int i, j, w, s, texton, c; // iterators

   int x, y; // image coordinates

   float error_texton; // distance between an image patch and a texton


   uint8_t *buf;


   // ***********************

   //   DICTIONARY LEARNING

   // ***********************


   if (!dictionary_initialized) {

     // **************

     // INITIALISATION

     // **************


     printf("Intializing dictionary!\n");


     // in the first image, we initialize the textons to random patches in the image

     for (w = 0; w < n_textons; w++) {

       // select a coordinate

       x = rand() % (width - patch_size);

       y = rand() % (height - patch_size);


       //printf("(x,y) = (%d,%d), (w,h) = (%d,%d), ps = %d\n", x, y, width, height, patch_size);

       // take the sample

       for (i = 0; i < patch_size; i++) {

         buf = frame + (width * 2 * (i + y)) + 2 * x;

         for (j = 0; j < patch_size; j++) {

           // put it in a texton

           printf("Setting dictionary:\n");

           // U/V component


           dictionary[w][i][j][0] = (float) * buf;

           buf += 1;

           // Y1/Y2 component

           dictionary[w][i][j][1] = (float) * buf;

           buf += 1;

           printf("Done!\n");

         }

       }

     }

     dictionary_initialized = 1;

   } else {

     // ********

     // LEARNING

     // ********

     printf("Learning!");

     alpha = ((float) alpha_uint) / 255.0;


     float *texton_distances, * **patch;

     texton_distances = (float *)calloc(n_textons, sizeof(float));

     patch = (float ** *)calloc(patch_size, sizeof(float **));


     for (i = 0; i < patch_size; i++) {

       patch[i] = (float **)calloc(patch_size, sizeof(float *));

       for (j = 0; j < patch_size; j++) {

         patch[i][j] = (float *)calloc(2, sizeof(float));

       }

     }


     // Extract and learn from n_samples_image per image

     for (s = 0; s < n_samples_image; s++) {

       // select a random sample from the image

       x = rand() % (width - patch_size);

       y = rand() % (height - patch_size);


       // reset texton_distances

       for (texton = 0; texton < n_textons; texton++) {

         texton_distances[texton] = 0;

       }


       // extract sample

       for (i = 0; i < patch_size; i++) {

         buf = frame + (width * 2 * (i + y)) + 2 * x;

         for (j = 0; j < patch_size; j++) {

           // U/V component

           patch[i][j][0] = (float) * buf;

           buf += 1;

           // Y1/Y2 component

           patch[i][j][1] = (float) * buf;

           buf += 1;

         }

       }


       // determine distances to the textons:

       for (i = 0; i < patch_size; i++) {

         for (j = 0; j < patch_size; j++) {

           for (c = 0; c < 2; c++) {

             // determine the distance to textons

             for (texton = 0; texton < n_textons; texton++) {

               texton_distances[texton] += (patch[i][j][c] - dictionary[texton][i][j][c])

                                           * (patch[i][j][c] - dictionary[texton][i][j][c]);

             }

           }

         }

       }


       // search the closest texton

       int assignment = 0;

       float min_dist = texton_distances[0];

       for (texton = 1; texton < n_textons; texton++) {

         if (texton_distances[texton] < min_dist) {

           min_dist = texton_distances[texton];

           assignment = texton;

         }

       }


       // move the neighbour closer to the input

       for (i = 0; i < patch_size; i++) {

         for (j = 0; j < patch_size; j++) {

           for (c = 0; c < 2; c++) {

             error_texton = patch[i][j][c] - dictionary[assignment][i][j][c];

             dictionary[assignment][i][j][c] += (alpha * error_texton);

           }

         }

       }


       // Augment the number of learned samples:

       learned_samples++;

     }


     // Free the allocated memory:

     for (i = 0; i < patch_size; i++) {

       for (j = 0; j < patch_size; j++) {

         free(patch[i][j]);

       }

       free(patch[i]);

     }

     free(patch);

     free(texton_distances);

   }


   // Free the buffer

   buf = NULL;

   free(buf);

 }


 void DistributionExtraction(uint8_t *frame, uint16_t width, uint16_t height)

 {

   int i, j, texton, c; // iterators

   int x, y; // coordinates

   int n_extracted_textons = 0;


   uint8_t *buf;


   // ************************

   //       EXECUTION

   // ************************


   printf("Execute!\n");


   // Allocate memory for texton distances and image patch:

   float *texton_distances, * **patch;

   texton_distances = (float *)calloc(n_textons, sizeof(float));

   patch = (float ** *)calloc(patch_size, sizeof(float **));

   for (i = 0; i < patch_size; i++) {

     patch[i] = (float **)calloc(patch_size, sizeof(float *));

     for (j = 0; j < patch_size; j++) {

       patch[i][j] = (float *)calloc(2, sizeof(float));

     }

   }


   int finished = 0;

   x = 0;

   y = 0;

   while (!finished) {

     if (!FULL_SAMPLING) {

       x = border_width + rand() % (width - patch_size - 2 * border_width);

       y = border_height + rand() % (height - patch_size - 2 * border_height);

     }


     // reset texton_distances

     for (texton = 0; texton < n_textons; texton++) {

       texton_distances[texton] = 0;

     }


     // extract sample

     for (i = 0; i < patch_size; i++) {

       buf = frame + (width * 2 * (i + y)) + 2 * x;

       for (j = 0; j < patch_size; j++) {

         // U/V component

         patch[i][j][0] = (float) * buf;

         buf += 1;

         // Y1/Y2 component

         patch[i][j][1] = (float) * buf;

         buf += 1;

       }

     }


     // determine distances:

     for (i = 0; i < patch_size; i++) {

       for (j = 0; j < patch_size; j++) {

         for (c = 0; c < 2; c++) {

           // determine the distance to words

           for (texton = 0; texton < n_textons; texton++) {

             texton_distances[texton] += (patch[i][j][c] - dictionary[texton][i][j][c])

                                         * (patch[i][j][c] - dictionary[texton][i][j][c]);

           }

         }

       }

     }


     // determine the nearest neighbour

     // search the closest centroid

     int assignment = 0;

     float min_dist = texton_distances[0];

     for (texton = 1; texton < n_textons; texton++) {

       if (texton_distances[texton] < min_dist) {

         min_dist = texton_distances[texton];

         assignment = texton;

       }

     }


     // put the assignment in the histogram

     texton_distribution[assignment]++;

     n_extracted_textons++;


     if (!FULL_SAMPLING && n_extracted_textons == n_samples_image) {

       finished = 1;

     } else {

       // FULL_SAMPLING is actually a sampling that covers the image:

       y += patch_size;

       // True full sampling would require:

       // y++;


       if (y > height - patch_size) {

         if (!FULL_SAMPLING) {

           x += patch_size;

         } else {

           x++;

         }

         y = 0;

       }

       if (x > width - patch_size) {

         finished = 1;

       }

     }

   }


   // Normalize distribution:

   for (i = 0; i < n_textons; i++) {

     texton_distribution[i] = texton_distribution[i] / (float) n_extracted_textons;

     // printf("textons[%d] = %f\n", i, texton_distribution[i]);

   }

   // printf("\n");


   // free memory:

   for (i = 0; i < patch_size; i++) {

     for (j = 0; j < patch_size; j++) {

       free(patch[i][j]);

     }

     free(patch[i]);

   }

   free(patch);

   free(texton_distances);


   buf = NULL;

   free(buf);


 } // EXECUTION


 /**
  * Save the texton dictionary as text, one float per line.
  *
  * The file is <DICTIONARY_PATH>/Dictionary_<dictionary_number>.dat and is
  * overwritten when it exists. Values are written per texton, per row, per
  * column, first channel 0 and then channel 1, which is the order expected by
  * load_texton_dictionary(). Failures are reported on stderr; nothing is
  * returned to the caller.
  */
 void save_texton_dictionary(void)
 {
   char filename[512];

   if (dictionary == NULL) {
     fprintf(stderr, "No texton dictionary allocated, nothing to save.\n");
     return;
   }

   // Bounded formatting: the path comes from a build-time macro of unknown length
   const int len = snprintf(filename, sizeof(filename), "%s/Dictionary_%05d.dat",
                            STRINGIFY(DICTIONARY_PATH), dictionary_number);
   if (len < 0 || (size_t) len >= sizeof(filename)) {
     fprintf(stderr, "Texton dictionary file name is too long, dictionary not saved.\n");
     return;
   }

   dictionary_logger = fopen(filename, "w");
   if (dictionary_logger == NULL) {
     // perror() appends ": <reason>\n" itself, so the message has no newline
     perror("Error while opening the file");
     return;
   }

   // (over-)write dictionary
   for (int i = 0; i < n_textons; i++) {
     for (int j = 0; j < patch_size; j++) {
       for (int k = 0; k < patch_size; k++) {
         fprintf(dictionary_logger, "%f\n", dictionary[i][j][k][0]);
         fprintf(dictionary_logger, "%f\n", dictionary[i][j][k][1]);
       }
     }
   }

   // A failed write may only show up in the stream state or when closing
   const int write_failed = ferror(dictionary_logger);
   const int close_failed = (fclose(dictionary_logger) != 0);
   dictionary_logger = NULL; // do not keep a handle to a closed stream

   if (write_failed || close_failed) {
     fprintf(stderr, "Error while writing the texton dictionary to %s\n", filename);
   }
 }


 /**
  * Load the texton dictionary from
  * <DICTIONARY_PATH>/Dictionary_<dictionary_number>.dat.
  *
  * The file has to hold n_textons * patch_size * patch_size * 2 floats in the
  * order written by save_texton_dictionary(). dictionary_ready is set only
  * when all of them have been read. When the file cannot be opened, or is
  * truncated or malformed, the module falls back to learning a dictionary:
  * load_dictionary, learned_samples and dictionary_initialized are cleared.
  */
 void load_texton_dictionary(void)
 {
   char filename[512];
   int file_opened = 0;
   int complete = 0;

   // Nothing to load into; keep the state so that a later call can retry
   if (dictionary == NULL) {
     return;
   }

   const int len = snprintf(filename, sizeof(filename), "%s/Dictionary_%05d.dat",
                            STRINGIFY(DICTIONARY_PATH), dictionary_number);

   if (len >= 0 && (size_t) len < sizeof(filename)) {
     dictionary_logger = fopen(filename, "r");
   } else {
     dictionary_logger = NULL; // file name does not fit, treat as missing
   }

   if (dictionary_logger != NULL) {
     file_opened = 1;
     complete = 1;

     // Load the dictionary; stop at the first value that cannot be read.
     // fscanf() returns the number of converted items, so anything but 1
     // (EOF or a matching failure) means the value is missing.
     for (int i = 0; complete && i < n_textons; i++) {
       for (int j = 0; complete && j < patch_size; j++) {
         for (int k = 0; complete && k < patch_size; k++) {
           if (fscanf(dictionary_logger, "%f\n", &dictionary[i][j][k][0]) != 1
               || fscanf(dictionary_logger, "%f\n", &dictionary[i][j][k][1]) != 1) {
             complete = 0;
           }
         }
       }
     }

     fclose(dictionary_logger);
     dictionary_logger = NULL; // do not keep a handle to a closed stream
   }

   if (complete) {
     dictionary_ready = 1;
     return;
   }

   // No usable dictionary on file: start learning one
   if (file_opened) {
     printf("Texton dictionary %d is incomplete or unreadable, we start learning one.\n", dictionary_number);
   } else {
     printf("Texton dictionary %d does not exist, we start learning one.\n", dictionary_number);
   }
   load_dictionary = 0;
   learned_samples = 0;
   dictionary_initialized = 0;
 }


 /**
  * Free a dictionary that may be only partially allocated.
  * Relies on calloc() having zeroed every pointer level, so that entries
  * that were never allocated are NULL.
  */
 static void textons_init_release_dictionary(float ****dict, int textons, int size)
 {
   if (dict == NULL) {
     return;
   }
   for (int w = 0; w < textons; w++) {
     if (dict[w] == NULL) {
       continue;
     }
     for (int i = 0; i < size; i++) {
       if (dict[w][i] == NULL) {
         continue;
       }
       for (int j = 0; j < size; j++) {
         free(dict[w][i][j]);
       }
       free(dict[w][i]);
     }
     free(dict[w]);
   }
   free(dict);
 }

 /**
  * Initialize the texton module: reset the learning state, allocate the
  * histogram (n_textons floats) and the dictionary
  * (n_textons x patch_size x patch_size x 2 floats, all zero), and register
  * texton_func() with the computer vision framework.
  *
  * When an allocation fails, everything is released again and texton_func()
  * is not registered.
  */
 void textons_init(void)
 {
   printf("Textons init\n");

   // texton_func() rounds an odd patch_size up by one. Apply the same rule
   // before sizing the dictionary, otherwise the dictionary would be one
   // element too small in both patch dimensions.
   if (patch_size % 2 == 1) {
     patch_size++;
   }

   dictionary_initialized = 0;
   learned_samples = 0;
   dictionary_ready = 0;

   texton_distribution = calloc(n_textons, sizeof(*texton_distribution));
   dictionary = calloc(n_textons, sizeof(*dictionary));

   int ok = (texton_distribution != NULL && dictionary != NULL);
   for (int w = 0; ok && w < n_textons; w++) {
     dictionary[w] = calloc(patch_size, sizeof(*dictionary[w]));
     ok = (dictionary[w] != NULL);
     for (int i = 0; ok && i < patch_size; i++) {
       dictionary[w][i] = calloc(patch_size, sizeof(*dictionary[w][i]));
       ok = (dictionary[w][i] != NULL);
       for (int j = 0; ok && j < patch_size; j++) {
         dictionary[w][i][j] = calloc(2, sizeof(*dictionary[w][i][j]));
         ok = (dictionary[w][i][j] != NULL);
       }
     }
   }

   if (!ok) {
     fprintf(stderr, "Textons init: could not allocate the dictionary, module not started.\n");
     textons_init_release_dictionary(dictionary, n_textons, patch_size);
     dictionary = NULL;
     free(texton_distribution);
     texton_distribution = NULL;
     return;
   }

   cv_add(texton_func);
 }


 void textons_stop(void)

 {

   free(texton_distribution);

   free(dictionary);

 }


n_samples_image
uint32_t n_samples_image
Definition: textons.c:99

uint16_t
unsigned short uint16_t
Definition: types.h:16

load_dictionary
uint8_t load_dictionary
Definition: textons.c:94

TEXTONS_PATCH_SIZE
#define TEXTONS_PATCH_SIZE
Definition: textons.c:64

image_t::buf_size
uint32_t buf_size
The buffer size.
Definition: image.h:52

border_height
uint32_t border_height
Definition: textons.c:102

TEXTONS_FULL_SAMPLING
#define TEXTONS_FULL_SAMPLING
Definition: textons.c:74

alpha
float alpha
Definition: textons.c:107

image_t
Definition: image.h:43

border_width
uint32_t border_width
Definition: textons.c:101

patch_size
uint8_t patch_size
Definition: textons.c:97

dictionary_number
uint8_t dictionary_number
Definition: textons.c:103

textons.h
Takes an image and represents the texture and colors in the image with a texton histogram.

DistributionExtraction
void DistributionExtraction(uint8_t *frame, uint16_t width, uint16_t height)
Function that extracts a texton histogram from an image.
Definition: textons.c:311

EOF
#define EOF
Definition: usb_ser_hw.c:87

TEXTONS_DICTIONARY_NUMBER
#define TEXTONS_DICTIONARY_NUMBER
Definition: textons.c:89

save_texton_dictionary
void save_texton_dictionary(void)
Save the texton dictionary.
Definition: textons.c:441

textons_init
void textons_init(void)
Initialize.
Definition: textons.c:501

TEXTONS_LOAD_DICTIONARY
#define TEXTONS_LOAD_DICTIONARY
Definition: textons.c:44

n_learning_samples
uint32_t n_learning_samples
Definition: textons.c:98

alpha_uint
uint8_t alpha_uint
Definition: textons.c:95

TEXTONS_ALPHA
#define TEXTONS_ALPHA
Definition: textons.c:49

load_texton_dictionary
void load_texton_dictionary(void)
Load a texton dictionary.
Definition: textons.c:471

image_t::w
uint16_t w
Image width.
Definition: image.h:45

uint32_t
unsigned long uint32_t
Definition: types.h:18

cv.h
Computer vision framework for onboard processing.

image_t::h
uint16_t h
Image height.
Definition: image.h:46

textons_stop
void textons_stop(void)
Definition: textons.c:522

image_t::buf
void * buf
Image buffer (depending on the image_type)
Definition: image.h:53

n_textons
uint8_t n_textons
Definition: textons.c:96

TEXTONS_N_TEXTONS
#define TEXTONS_N_TEXTONS
Definition: textons.c:54

TEXTONS_N_LEARNING_SAMPLES
#define TEXTONS_N_LEARNING_SAMPLES
Definition: textons.c:69

uint8_t
unsigned char uint8_t
Definition: types.h:14

dictionary_logger
static FILE * dictionary_logger
Definition: textons.c:110

dictionary
float **** dictionary
Definition: textons.c:37

dictionary_ready
uint8_t dictionary_ready
Definition: textons.c:106

texton_func
struct image_t * texton_func(struct image_t *img)
Main texton processing function that first either loads or learns a dictionary and then extracts the ...
Definition: textons.c:121

dictionary_initialized
uint8_t dictionary_initialized
Definition: textons.c:39

learned_samples
uint32_t learned_samples
Definition: textons.c:38

FULL_SAMPLING
uint8_t FULL_SAMPLING
Definition: textons.c:100

TEXTONS_N_SAMPLES
#define TEXTONS_N_SAMPLES
Definition: textons.c:59

DICTIONARY_PATH
#define DICTIONARY_PATH
Definition: textons.c:112

TEXTONS_BORDER_WIDTH
#define TEXTONS_BORDER_WIDTH
Definition: textons.c:79

texton_distribution
float * texton_distribution
Definition: textons.c:40

DictionaryTrainingYUV
void DictionaryTrainingYUV(uint8_t *frame, uint16_t width, uint16_t height)
Function that performs one pass for dictionary training.
Definition: textons.c:166

TEXTONS_BORDER_HEIGHT
#define TEXTONS_BORDER_HEIGHT
Definition: textons.c:84