libmpcodecs/vf_remove_logo.c

   1 /*
   2 Copyright 2005 Robert Edele.
   3
   4 e-mail: yartrebo@earthlink.net
   5
   6 This program is free software; you can redistribute it and/or modify it
   7 under the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 2 of the License, or (at your option)
   9 any later version.
  10
  11 This program is distributed in the hope that it will be useful, but
  12 WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
  13 or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Public License for more
  14 details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with this program; if not, write to the
  18 Free Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
  19 02111-1307 USA
  20
  21 __________________________________________________________________________
  22 | Robert Edele                                           Fri. 4-Feb-2005 |
  23 | This program loads a .pgm mask file showing where a logo is and uses   |
  24 | a blur transform to remove the logo.                                   |
  25 |________________________________________________________________________|
  26 */
  27
  28 /**
  29  * \file vf_remove_logo.c
  30  *
  31  * \brief Advanced blur-based logo removing filter.
  32
  33  *     Hello and welcome. This code implements a filter to remove annoying TV
  34  * logos and other annoying images placed onto a video stream. It works by filling
  35  * in the pixels that comprise the logo with neighboring pixels. The transform is
  36  * very loosely based on a gaussian blur, but it is different enough to merit its
  37  * own paragraph later on. It is a major improvement on the old delogo filter as
  38  * it both uses a better blurring algorithm and uses a bitmap to use an arbitrary
  39  * and generally much tighter fitting shape than a rectangle.
  40  *
  41  *     The filter requires 1 argument and has no optional arguments. It requires
  42  * a filter bitmap, which must be in PGM or PPM format. A sample invocation would
  43  * be -vf remove_logo=/home/username/logo_bitmaps/xyz.pgm.  Pixels with a value of
  44  * zero are not part of the logo, and non-zero pixels are part of the logo. If you
  45  * use white (255) for the logo and black (0) for the rest, you will be safe. For
  46  * making the filter bitmap, I recommend taking a screen capture of a black frame
  47  * with the logo visible, and then using The GIMP's threshold filter followed by
  48  * the erode filter once or twice. If needed, little splotches can be fixed
  49  * manually. Remember that if logo pixels are not covered, the filter quality will
  50  * be much reduced. Marking too many pixels as part of the logo doesn't hurt as
  51  * much, but it will increase the amount of blurring needed to cover over the
  52  * image and will destroy more information than necessary. Additionally, this blur
  53  * algorithm is O(n^4), where n is the width and height of a hypothetical
  54  * square logo, so extra pixels will slow things down on a large logo.
  55  *
  56  *     The logo removal algorithm has two key points. The first is that it
  57  * distinguishes between pixels in the logo and those not in the logo by using the
  58  * passed-in bitmap. Pixels not in the logo are copied over directly without being
  59  * modified and they also serve as source pixels for the logo fill-in. Pixels
  60  * inside the logo have the mask applied.
  61  *
  62  *     At init-time the bitmap is reprocessed internally, and the distance to the
  63  * nearest edge of the logo (Manhattan distance), along with a little extra to
  64  * remove rough edges, is stored in each pixel. This is done using an in-place
  65  * erosion algorithm, and incrementing each pixel that survives any given erosion.
  66  * Once every pixel is eroded, the maximum value is recorded, and a set of masks
  67  * from size 0 to this size are generated. The masks are circular binary masks,
  68  * where each pixel within a radius N (where N is the size of the mask) is a 1,
  69  * and all other pixels are a 0. Although a gaussian mask would be more
  70  * mathematically accurate, a binary mask works better in practice because we
  71  * generally do not use the central pixels in the mask (because they are in the
  72  * logo region), and thus a gaussian mask will cause too little blur and thus a
  73  * very unstable image.
  74  *
  75  *     The mask is applied in a special way. Namely, only pixels in the mask that
  76  * line up to pixels outside the logo are used. The dynamic mask size means that
  77  * the mask is just big enough so that the edges touch pixels outside the logo, so
  78  * the blurring is kept to a minimum and at least the first boundary condition is
  79  * met (that the image function itself is continuous), even if the second boundary
  80  * condition (that the derivative of the image function is continuous) is not met.
  81  * A masking algorithm that does preserve the second boundary condition
  82  * (perhaps something based on a highly-modified bi-cubic algorithm) should offer
  83  * even better results on paper, but the noise in a typical TV signal should make
  84  * anything based on derivatives hopelessly noisy.
  85  */
  86
  87 #include <stdio.h>
  88 #include <stdlib.h>
  89 #include <string.h>
  90 #include <ctype.h>
  91 #include <inttypes.h>
  92
  93 #include "config.h"
  94 #include "mp_msg.h"
  95 #include "libvo/fastmemcpy.h"
  96
  97 #include "img_format.h"
  98 #include "mp_image.h"
  99 #include "vf.h"
 100
 101 //===========================================================================//
 102
 103 /** \brief Returns the larger of the two arguments. **/
 104 #define max(x,y) ((x)>(y)?(x):(y))
 105 /** \brief Returns the smaller of the two arguments. **/
 106 #define min(x,y) ((x)>(y)?(y):(x))
 107
 108 /**
 109  * \brief Test if a pixel is part of the logo.
 110  */
 111 #define test_filter(image, x, y) ((unsigned char) (image->pixel[((y) * image->width) + (x)]))
 112
 113 /**
 114  * \brief Chooses a slightly larger mask size to improve performance.
 115  *
 116  * This function maps the absolute minimum mask size needed to the mask size we'll
 117  * actually use. f(x) = x (the smallest that will work) will produce the sharpest
 118  * results, but will be quite jittery. f(x) = 1.25x (what I'm using) is a good
 119  * tradeoff in my opinion. This will calculate only at init-time, so you can put a
 120  * long expression here without effecting performance.
 121  */
 122 #define apply_mask_fudge_factor(x) (((x) >> 2) + x)
 123
/**
 * \brief Simple implementation of the PGM image format.
 *
 * This struct holds a bare-bones image loaded from a PGM or PPM file. Once
 * loaded and pre-processed, each pixel in this struct will contain how far from
 * the edge of the logo each pixel is, using the manhattan distance (|dx| + |dy|).
 *
 * Pixels in unsigned char * pixel can be addressed using (y * width) + x.
 */
typedef struct
{
  unsigned int width;  /* Number of pixels in one row. */
  unsigned int height; /* Number of rows. */

  unsigned char * pixel; /* width * height bytes, one per pixel, stored row after row. */

} pgm_structure;
 141
/**
 * \brief Stores persistent variables.
 *
 * Variables stored here are kept from frame to frame, and separate instances of
 * the filter will get their own separate copies.
 */
typedef struct
{
  unsigned int fmt; /* Image format handed to the next filter. config() stores the result of find_best() here (IMGFMT_YV12, or 0 when it is not supported). */
  int max_mask_size; /* The largest possible mask size that will be needed with the given filter and corresponding half_size_filter. The half_size_filter can have a larger requirement in some rare (but not degenerate) cases. */
  int * * * mask; /* Stores our collection of masks. The first * is for an array of masks, the second for the y axis, and the third for the x axis. */
  pgm_structure * filter; /* Stores the full-size filter image. This is used to tell what pixels are in the logo or not in the luma plane. */
  pgm_structure * half_size_filter; /* Stores a 50% width and 50% height filter image. This is used to tell what pixels are in the logo or not in the chroma planes. */
  /* These 8 variables store the bounding rectangles that the logo resides in: four for the full-size filter, four for the half-size filter. */
  int bounding_rectangle_posx1;
  int bounding_rectangle_posy1;
  int bounding_rectangle_posx2;
  int bounding_rectangle_posy2;
  int bounding_rectangle_half_size_posx1;
  int bounding_rectangle_half_size_posy1;
  int bounding_rectangle_half_size_posx2;
  int bounding_rectangle_half_size_posy2;
} vf_priv_s;
 165
 166 /**
 167  * \brief Mallocs memory and checks to make sure it succeeded.
 168  *
 169  * \param size How many bytes to allocate.
 170  *
 171  * \return A pointer to the freshly allocated memory block, or NULL on failutre.
 172  *
 173  * Mallocs memory, and checks to make sure it was successfully allocated. Because
 174  * of how MPlayer works, it cannot safely halt execution, but at least the user
 175  * will get an error message before the segfault happens.
 176  */
 177 void * safe_malloc(int size)
 178 {
 179   void * answer = malloc(size);
 180   if (answer == NULL)
 181     mp_msg(MSGT_VFILTER, MSGL_ERR, "Unable to allocate memory in vf_remove_logo.c\n");
 182
 183   return answer;
 184 }
 185
 186 /**
 187  * \brief Calculates the smallest rectangle that will encompass the logo region.
 188  *
 189  * \param filter This image contains the logo around which the rectangle will
 190  *        will be fitted.
 191  *
 192  * The bounding rectangle is calculated by testing successive lines (from the four
 193  * sides of the rectangle) until no more can be removed without removing logo
 194  * pixels. The results are returned by reference to posx1, posy1, posx2, and
 195  * posy2.
 196  */
 197
 198 void calculate_bounding_rectangle(int * posx1, int * posy1, int * posx2, int * posy2, pgm_structure * filter)
 199 {
 200   int x; /* Temporary variables to run  */
 201   int y; /* through each row or column. */
 202   int start_x;
 203   int start_y;
 204   int end_x = filter->width - 1;
 205   int end_y = filter->height - 1;
 206   int did_we_find_a_logo_pixel = 0;
 207
 208   /* Let's find the top bound first. */
 209   for (start_x = 0; start_x < filter->width && !did_we_find_a_logo_pixel; start_x++)
 210   {
 211     for (y = 0; y < filter->height; y++)
 212     {
 213       did_we_find_a_logo_pixel |= test_filter(filter, start_x, y);
 214     }
 215   }
 216   start_x--;
 217
 218   /* Now the bottom bound. */
 219   did_we_find_a_logo_pixel = 0;
 220   for (end_x = filter->width - 1; end_x > start_x && !did_we_find_a_logo_pixel; end_x--)
 221   {
 222     for (y = 0; y < filter->height; y++)
 223     {
 224       did_we_find_a_logo_pixel |= test_filter(filter, end_x, y);
 225     }
 226   }
 227   end_x++;
 228
 229   /* Left bound. */
 230   did_we_find_a_logo_pixel = 0;
 231   for (start_y = 0; start_y < filter->height && !did_we_find_a_logo_pixel; start_y++)
 232   {
 233     for (x = 0; x < filter->width; x++)
 234     {
 235       did_we_find_a_logo_pixel |= test_filter(filter, x, start_y);
 236     }
 237   }
 238   start_y--;
 239
 240   /* Right bound. */
 241   did_we_find_a_logo_pixel = 0;
 242   for (end_y = filter->height - 1; end_y > start_y && !did_we_find_a_logo_pixel; end_y--)
 243   {
 244     for (x = 0; x < filter->width; x++)
 245     {
 246       did_we_find_a_logo_pixel |= test_filter(filter, x, end_y);
 247     }
 248   }
 249   end_y++;
 250
 251   *posx1 = start_x;
 252   *posy1 = start_y;
 253   *posx2 = end_x;
 254   *posy2 = end_y;
 255
 256   return;
 257 }
 258
 259 /**
 260  * \brief Free mask memory.
 261  *
 262  * \param vf Data structure which stores our persistant data, and is to be freed.
 263  *
 264  * We call this function when our filter is done. It will free the memory
 265  * allocated to the masks and leave the variables in a safe state.
 266  */
 267 void destroy_masks(vf_instance_t * vf)
 268 {
 269   int a, b;
 270
 271   /* Load values from the vf->priv struct for faster dereferencing. */
 272   int * * * mask = ((vf_priv_s *)vf->priv)->mask;
 273   int max_mask_size = ((vf_priv_s *)vf->priv)->max_mask_size;
 274
 275   if (mask == NULL)
 276     return; /* Nothing allocated, so return before we segfault. */
 277
 278   /* Free all allocated memory. */
 279   for (a = 0; a <= max_mask_size; a++) /* Loop through each mask. */
 280   {
 281     for (b = -a; b <= a; b++) /* Loop through each scanline in a mask. */
 282     {
 283       free(mask[a][b + a]); /* Free a scanline. */
 284     }
 285     free(mask[a]); /* Free a mask. */
 286   }
 287   free(mask); /* Free the array of pointers pointing to the masks. */
 288
 289   /* Set the pointer to NULL, so that any duplicate calls to this function will not cause a crash. */
 290   ((vf_priv_s *)vf->priv)->mask = NULL;
 291
 292   return;
 293 }
 294
 295 /**
 296  * \brief Set up our array of masks.
 297  *
 298  * \param vf Where our filter stores persistance data, like these masks.
 299  *
 300  * This creates an array of progressively larger masks and calculates their
 301  * values. The values will not change during program execution once this function
 302  * is done.
 303  */
 304 void initialize_masks(vf_instance_t * vf)
 305 {
 306   int a, b, c;
 307
 308   /* Load values from the vf->priv struct for faster dereferencing. */
 309   int * * * mask = ((vf_priv_s *)vf->priv)->mask;
 310   int max_mask_size = ((vf_priv_s *)vf->priv)->max_mask_size; /* This tells us how many masks we'll need to generate. */
 311
 312   /* Create a circular mask for each size up to max_mask_size. When the filter is applied, the mask size is
 313      determined on a pixel by pixel basis, with pixels nearer the edge of the logo getting smaller mask sizes. */
 314   mask = (int * * *) safe_malloc(sizeof(int * *) * (max_mask_size + 1));
 315   for (a = 0; a <= max_mask_size; a++)
 316   {
 317     mask[a] = (int * *) safe_malloc(sizeof(int *) * ((a * 2) + 1));
 318     for (b = -a; b <= a; b++)
 319     {
 320       mask[a][b + a] = (int *) safe_malloc(sizeof(int) * ((a * 2) + 1));
 321       for (c = -a; c <= a; c++)
 322       {
 323         if ((b * b) + (c * c) <= (a * a)) /* Circular 0/1 mask. */
 324           mask[a][b + a][c + a] = 1;
 325         else
 326           mask[a][b + a][c + a] = 0;
 327       }
 328     }
 329   }
 330
 331   /* Store values back to vf->priv so they aren't lost after the function returns. */
 332   ((vf_priv_s *)vf->priv)->mask = mask;
 333
 334   return;
 335 }
 336
 337 /**
 338  * \brief Pre-processes an image to give distance information.
 339  *
 340  * \param vf Data structure that holds persistant information. All it is used for
 341              in this function is to store the calculated max_mask_size variable.
 342  * \param mask This image will be converted from a greyscale image into a
 343  *             distance image.
 344  *
 345  * This function takes a greyscale image (pgm_structure * mask) and converts it
 346  * in place into a distance image. A distance image is zero for pixels ourside of
 347  * the logo and is the manhattan distance (|dx| + |dy|) for pixels inside of the
 348  * logo. This will overestimate the distance, but that is safe, and is far easier
 349  * to implement than a proper pythagorean distance since I'm using a modified
 350  * erosion algorithm to compute the distances.
 351  */
 352 void convert_mask_to_strength_mask(vf_instance_t * vf, pgm_structure * mask)
 353 {
 354   int x, y; /* Used by our for loops to go through every single pixel in the picture one at a time. */
 355   int has_anything_changed = 1; /* Used by the main while() loop to know if anything changed on the last erosion. */
 356   int current_pass = 0; /* How many times we've gone through the loop. Used in the in-place erosion algorithm
 357                            and to get us max_mask_size later on. */
 358   int max_mask_size; /* This will record how large a mask the pixel that is the furthest from the edge of the logo
 359                            (and thus the neediest) is. */
 360   char * current_pixel = mask->pixel; /* This stores the actual pixel data. */
 361
 362   /* First pass, set all non-zero values to 1. After this loop finishes, the data should be considered numeric
 363      data for the filter, not color data. */
 364   for (x = 0; x < mask->height * mask->width; x++, current_pixel++)
 365     if(*current_pixel) *current_pixel = 1;
 366
 367   /* Second pass and future passes. For each pass, if a pixel is itself the same value as the current pass,
 368      and its four neighbors are too, then it is incremented. If no pixels are incremented by the end of the pass,
 369      then we go again. Edge pixels are counted as always excluded (this should be true anyway for any sane mask,
 370      but if it isn't this will ensure that we eventually exit). */
 371   while (has_anything_changed)
 372   {
 373     current_pass++;
 374     current_pixel = mask->pixel;
 375
 376     has_anything_changed = 0; /* If this doesn't get set by the end of this pass, then we're done. */
 377
 378     for (y = 1; y < mask->height - 1; y++)
 379     {
 380       for (x = 1; x < mask->width - 1; x++)
 381       {
 382         /* Apply the in-place erosion transform. It is based on the following two premises: 1 - Any pixel that fails 1 erosion
 383            will fail all future erosions. 2 - Only pixels having survived all erosions up to the present will be >= to
 384            current_pass. It doesn't matter if it survived the current pass, failed it, or hasn't been tested yet. */
 385         if (*current_pixel >= current_pass && /* By using >= instead of ==, we allow the algorithm to work in place. */
 386             *(current_pixel + 1) >= current_pass &&
 387             *(current_pixel - 1) >= current_pass &&
 388             *(current_pixel + mask->width) >= current_pass &&
 389             *(current_pixel - mask->width) >= current_pass)
 390          {
 391            (*current_pixel)++; /* Increment the value since it still has not been eroded, as evidenced by the if statement
 392                                   that just evaluated to true. */
 393            has_anything_changed = 1;
 394          }
 395         current_pixel++;
 396       }
 397     }
 398   }
 399
 400   /* Apply the fudge factor, which will increase the size of the mask a little to reduce jitter at the cost of more blur. */
 401   for (y = 1; y < mask->height - 1; y++)
 402   {
 403    for (x = 1; x < mask->width - 1; x++)
 404     {
 405       mask->pixel[(y * mask->width) + x] = apply_mask_fudge_factor(mask->pixel[(y * mask->width) + x]);
 406     }
 407   }
 408
 409   max_mask_size = current_pass + 1; /* As a side-effect, we now know the maximum mask size, which we'll use to generate our masks. */
 410   max_mask_size = apply_mask_fudge_factor(max_mask_size); /* Apply the fudge factor to this number too, since we must
 411                                                              ensure that enough masks are generated. */
 412   ((vf_priv_s *)vf->priv)->max_mask_size = max_mask_size; /* Commit the newly calculated max_mask_size to the vf->priv struct. */
 413
 414   return;
 415 }
 416
 417 /**
 418  * \brief Our blurring function.
 419  *
 420  * \param vf Stores persistant data. In this function we are interested in the
 421  *           array of masks.
 422  * \param value_out The properly blurred and delogoed pixel is outputted here.
 423  * \param logo_mask Tells us which pixels are in the logo and which aren't.
 424  * \param image The image that is having its logo removed.
 425  * \param x x-coordinate of the pixel to blur.
 426  * \param y y-coordinate of the pixel to blur.
 427  * \param plane 0 = luma, 1 = blue chroma, 2 = red chroma (YUV).
 428  *
 429  * This function is the core of the filter. It takes a pixel that is inside the
 430  * logo and blurs it. It does so by finding the average of all the pixels within
 431  * the mask and outside of the logo.
 432  */
 433 void get_blur(const vf_instance_t * const vf, unsigned int * const value_out, const pgm_structure * const logo_mask,
 434               const mp_image_t * const image, const int x, const int y, const int plane)
 435 {
 436   int mask_size; /* Mask size tells how large a circle to use. The radius is about (slightly larger than) mask size. */
 437   /* Get values from vf->priv for faster dereferencing. */
 438   int * * * mask = ((vf_priv_s *)vf->priv)->mask;
 439
 440   int start_posx, start_posy, end_posx, end_posy;
 441   int i, j;
 442   unsigned int accumulator = 0, divisor = 0;
 443   const unsigned char * mask_read_position; /* What pixel we are reading out of the circular blur mask. */
 444   const unsigned char * logo_mask_read_position; /* What pixel we are reading out of the filter image. */
 445
 446   /* Prepare our bounding rectangle and clip it if need be. */
 447   mask_size = test_filter(logo_mask, x, y);
 448   start_posx = max(0, x - mask_size);
 449   start_posy = max(0, y - mask_size);
 450   end_posx = min(image->width - 1, x + mask_size);
 451   end_posy = min(image->height - 1, y + mask_size);
 452
 453   mask_read_position = image->planes[plane] + (image->stride[plane] * start_posy) + start_posx;
 454   logo_mask_read_position = logo_mask->pixel + (start_posy * logo_mask->width) + start_posx;
 455
 456   for (j = start_posy; j <= end_posy; j++)
 457   {
 458     for (i = start_posx; i <= end_posx; i++)
 459     {
 460       if (!(*logo_mask_read_position) && mask[mask_size][i - start_posx][j - start_posy])
 461       { /* Check to see if this pixel is in the logo or not. Only use the pixel if it is not. */
 462         accumulator += *mask_read_position;
 463         divisor++;
 464       }
 465
 466       mask_read_position++;
 467       logo_mask_read_position++;
 468     }
 469
 470     mask_read_position += (image->stride[plane] - ((end_posx + 1) - start_posx));
 471     logo_mask_read_position += (logo_mask->width - ((end_posx + 1) - start_posx));
 472   }
 473
 474   if (divisor == 0) /* This means that not a single pixel is outside of the logo, so we have no data. */
 475   { /* We should put some eye catching value here, to indicate the flaw to the user. */
 476     *value_out = 255;
 477   }
 478   else /* Else we need to normalise the data using the divisor. */
 479   {
 480     *value_out = (accumulator + (divisor / 2)) / divisor; /* Divide, taking into account average rounding error. */
 481   }
 482
 483   return;
 484 }
 485
 486 /**
 487  * \brief Free a pgm_structure. Undoes load_pgm(...).
 488  */
 489 void destroy_pgm(pgm_structure * to_be_destroyed)
 490 {
 491   if (to_be_destroyed == NULL)
 492     return; /* Don't do anything if a NULL pointer was passed it. */
 493
 494   /* Internally allocated memory. */
 495   if (to_be_destroyed->pixel != NULL)
 496   {
 497     free(to_be_destroyed->pixel);
 498     to_be_destroyed->pixel = NULL;
 499   }
 500
 501   /* Free the actual struct instance. This is done here and not by the calling function. */
 502   free(to_be_destroyed);
 503 }
 504
 505 /** \brief Helper function for load_pgm(...) to skip whitespace. */
 506 void load_pgm_skip(FILE *f) {
 507   int c, comment = 0;
 508   do {
 509     c = fgetc(f);
 510     if (c == '#')
 511       comment = 1;
 512     if (c == '\n')
 513       comment = 0;
 514   } while (c != EOF && (isspace(c) || comment));
 515   ungetc(c, f);
 516 }
 517
 518 #define REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE(message) {mp_msg(MSGT_VFILTER, MSGL_ERR, message); return NULL;}
 519
 520 /**
 521  * \brief Loads a raw pgm or ppm file into a newly created pgm_structure object.
 522  *
 523  * \param file_name The name of the file to be loaded. So long as the file is a
 524  *                  valid pgm or ppm file, it will load correctly, even if the
 525  *                  extension is missing or invalid.
 526  *
 527  * \return A pointer to the newly created pgm_structure object. Don't forget to
 528  *         call destroy_pgm(...) when you're done with this. If an error occurs,
 529  *         NULL is returned.
 530  *
 531  * Can load either raw pgm (P5) or raw ppm (P6) image files as a binary image.
 532  * While a pgm file will be loaded normally (greyscale), the only thing that is
 533  * guaranteed with ppm is that all zero (R = 0, G = 0, B = 0) pixels will remain
 534  * zero, and non-zero pixels will remain non-zero.
 535  */
 536 pgm_structure * load_pgm(const char * file_name)
 537 {
 538   unsigned char flags;
 539   int x, y;
 540   int maximum_greyscale_value;
 541   FILE * input;
 542   int pnm_number;
 543   pgm_structure * new_pgm = (pgm_structure *) safe_malloc (sizeof(pgm_structure));
 544   char * write_position;
 545   char * end_position;
 546   int image_size; /* width * height */
 547
 548   if((input = fopen(file_name, "rb")) == NULL) REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove-logo: Unable to open file. File not found or insufficient permissions.\n");
 549
 550   /* Parse the PGM header. */
 551   if (fgetc(input) != 'P') REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove-logo: File is not a valid PGM or PPM file.\n");
 552   pnm_number = fgetc(input) - '0';
 553   if (pnm_number != 5 && pnm_number != 6) REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove-logo: Invalid PNM file. Only raw PGM (Portable Gray Map) and raw PPM (Portable Pixel Map) subtypes are allowed.\n");
 554   load_pgm_skip(input);
 555   if (fscanf(input, "%i", &(new_pgm->width)) != 1) REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove-logo: Invalid PGM/PPM header.\n");
 556   load_pgm_skip(input);
 557   if (fscanf(input, "%i", &(new_pgm->height)) != 1) REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove-logo: Invalid PGM/PPM header.\n");
 558   load_pgm_skip(input);
 559   if (fscanf(input, "%i", &maximum_greyscale_value) != 1) REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove-logo: Invalid PGM/PPM header.\n");
 560   if (maximum_greyscale_value >= 256) REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove_logo: Only 1 byte per pixel (pgm) or 1 byte per color value (ppm) are supported.\n");
 561   load_pgm_skip(input);
 562
 563   new_pgm->pixel = (unsigned char *) safe_malloc (sizeof(unsigned char) * new_pgm->width * new_pgm->height);
 564
 565   /* Load the pixels. */
 566   /* Note: I am aware that fgetc(input) isn't the fastest way of doing things, but it is quite compact and the code only runs once when the filter is initialized.*/
 567   image_size = new_pgm->width * new_pgm->height;
 568   end_position = new_pgm->pixel + image_size;
 569   for (write_position = new_pgm->pixel; write_position < end_position; write_position++)
 570   {
 571     *write_position = fgetc(input);
 572     if (pnm_number == 6) /* This tests to see if the file is a PPM file. */
 573     { /* If it is, then consider the pixel set if any of the three color channels are set. Since we just care about == 0 or != 0, a bitwise or will do the trick. */
 574       *write_position |= fgetc(input);
 575       *write_position |= fgetc(input);
 576     }
 577   }
 578
 579   return new_pgm;
 580 }
 581
 582 /**
 583  * \brief Generates a scaled down image with half width, height, and intensity.
 584  *
 585  * \param vf Our struct for persistant data. In this case, it is used to update
 586  *           mask_max_size with the larger of the old or new value.
 587  * \param input_image The image from which the new half-sized one will be based.
 588  *
 589  * \return The newly allocated and shrunken image.
 590  *
 591  * This function not only scales down an image, but halves the value in each pixel
 592  * too. The purpose of this is to produce a chroma filter image out of a luma
 593  * filter image. The pixel values store the distance to the edge of the logo and
 594  * halving the dimensions halves the distance. This function rounds up, because
 595  * a downwards rounding error could cause the filter to fail, but an upwards
 596  * rounding error will only cause a minor amount of excess blur in the chroma
 597  * planes.
 598  */
 599 pgm_structure * generate_half_size_image(vf_instance_t * vf, pgm_structure * input_image)
 600 {
 601   int x, y;
 602   pgm_structure * new_pgm = (pgm_structure *) safe_malloc (sizeof(pgm_structure));
 603   int has_anything_changed = 1;
 604   int current_pass;
 605   int max_mask_size;
 606   char * current_pixel;
 607
 608   new_pgm->width = input_image->width / 2;
 609   new_pgm->height = input_image->height / 2;
 610   new_pgm->pixel = (unsigned char *) safe_malloc (sizeof(unsigned char) * new_pgm->width * new_pgm->height);
 611
 612   /* Copy over the image data, using the average of 4 pixels for to calculate each downsampled pixel. */
 613   for (y = 0; y < new_pgm->height; y++)
 614     for (x = 0; x < new_pgm->width; x++)
 615     {
 616       /* Set the pixel if there exists a non-zero value in the source pixels, else clear it. */
 617       new_pgm->pixel[(y * new_pgm->width) + x] = input_image->pixel[((y << 1) * input_image->width) + (x << 1)] ||
 618                                                  input_image->pixel[((y << 1) * input_image->width) + (x << 1) + 1] ||
 619                                                  input_image->pixel[(((y << 1) + 1) * input_image->width) + (x << 1)] ||
 620                                                  input_image->pixel[(((y << 1) + 1) * input_image->width) + (x << 1) + 1];
 621       new_pgm->pixel[(y * new_pgm->width) + x] = min(1, new_pgm->pixel[(y * new_pgm->width) + x]);
 622     }
 623
 624   /* Now we need to recalculate the numbers for the smaller size. Just using the old_value / 2 can cause subtle
 625      and fairly rare, but very nasty, bugs. */
 626
 627   current_pixel = new_pgm->pixel;
 628   /* First pass, set all non-zero values to 1. */
 629   for (x = 0; x < new_pgm->height * new_pgm->width; x++, current_pixel++)
 630     if(*current_pixel) *current_pixel = 1;
 631
 632   /* Second pass and future passes. For each pass, if a pixel is itself the same value as the current pass,
 633      and its four neighbors are too, then it is incremented. If no pixels are incremented by the end of the pass,
 634      then we go again. Edge pixels are counted as always excluded (this should be true anyway for any sane mask,
 635      but if it isn't this will ensure that we eventually exit). */
 636   current_pass = 0;
 637   while (has_anything_changed)
 638   {
 639     current_pass++;
 640
 641     has_anything_changed = 0; /* If this doesn't get set by the end of this pass, then we're done. */
 642
 643     for (y = 1; y < new_pgm->height - 1; y++)
 644     {
 645       for (x = 1; x < new_pgm->width - 1; x++)
 646       {
 647         if (new_pgm->pixel[(y * new_pgm->width) + x] >= current_pass && /* By using >= instead of ==, we allow the algorithm to work in place. */
 648             new_pgm->pixel[(y * new_pgm->width) + (x + 1)] >= current_pass &&
 649             new_pgm->pixel[(y * new_pgm->width) + (x - 1)] >= current_pass &&
 650             new_pgm->pixel[((y + 1) * new_pgm->width) + x] >= current_pass &&
 651             new_pgm->pixel[((y - 1) * new_pgm->width) + x] >= current_pass)
 652          {
 653            new_pgm->pixel[(y * new_pgm->width) + x]++; /* Increment the value since it still has not been eroded,
 654                                                     as evidenced by the if statement that just evaluated to true. */
 655            has_anything_changed = 1;
 656          }
 657       }
 658     }
 659   }
 660
 661   for (y = 1; y < new_pgm->height - 1; y++)
 662   {
 663    for (x = 1; x < new_pgm->width - 1; x++)
 664     {
 665       new_pgm->pixel[(y * new_pgm->width) + x] = apply_mask_fudge_factor(new_pgm->pixel[(y * new_pgm->width) + x]);
 666     }
 667   }
 668
 669   max_mask_size = current_pass + 1; /* As a side-effect, we now know the maximum mask size, which we'll use to generate our masks. */
 670   max_mask_size = apply_mask_fudge_factor(max_mask_size);
 671   /* Commit the newly calculated max_mask_size to the vf->priv struct. */
 672   ((vf_priv_s *)vf->priv)->max_mask_size = max(max_mask_size, ((vf_priv_s *)vf->priv)->max_mask_size);
 673
 674   return new_pgm;
 675 }
 676
 677 /**
 678  * \brief Checks if YV12 is supported by the next filter.
 679  */
 680 static unsigned int find_best(struct vf_instance_s* vf){
 681   int is_format_okay = vf->next->query_format(vf->next, IMGFMT_YV12);
 682   if ((is_format_okay & VFCAP_CSP_SUPPORTED_BY_HW) || (is_format_okay & VFCAP_CSP_SUPPORTED))
 683     return IMGFMT_YV12;
 684   else
 685     return 0;
 686 }
 687
 688 //===========================================================================//
 689
 690 /**
 691  * \brief Configure the filter and call the next filter's config function.
 692  */
 693 static int config(struct vf_instance_s* vf, int width, int height, int d_width, int d_height, unsigned int flags, unsigned int outfmt)
 694 {
 695   if(!(((vf_priv_s *)vf->priv)->fmt=find_best(vf)))
 696     return 0;
 697   else
 698     return vf_next_config(vf,width,height,d_width,d_height,flags,((vf_priv_s *)vf->priv)->fmt);
 699 }
 700
 701 /**
 702  * \brief Removes the logo from a plane (either luma or chroma).
 703  *
 704  * \param vf Not needed by this function, but needed by the blur function.
 705  * \param source The image to have it's logo removed.
 706  * \param destination Where the output image will be stored.
 707  * \param source_stride How far apart (in memory) two consecutive lines are.
 708  * \param destination Same as source_stride, but for the destination image.
 709  * \param width Width of the image. This is the same for source and destination.
 710  * \param height Height of the image. This is the same for source and destination.
 711  * \param is_image_direct If the image is direct, then source and destination are
 712  *        the same and we can save a lot of time by not copying pixels that
 713  *        haven't changed.
 714  * \param filter The image that stores the distance to the edge of the logo for
 715  *        each pixel.
 716  * \param logo_start_x Smallest x-coordinate that contains at least 1 logo pixel.
 717  * \param logo_start_y Smallest y-coordinate that contains at least 1 logo pixel.
 718  * \param logo_end_x Largest x-coordinate that contains at least 1 logo pixel.
 719  * \param logo_end_y Largest y-coordinate that contains at least 1 logo pixel.
 720  *
 721  * This function processes an entire plane. Pixels outside of the logo are copied
 722  * to the output without change, and pixels inside the logo have the de-blurring
 723  * function applied.
 724  */
 725 static void convert_yv12(const vf_instance_t * const vf, const char * const source, const int source_stride,
 726                          const mp_image_t * const source_image, const int width, const int height,
 727                          char * const destination, const int destination_stride, int is_image_direct, pgm_structure * filter,
 728                          const int plane, const int logo_start_x, const int logo_start_y, const int logo_end_x, const int logo_end_y)
 729 {
 730   int y;
 731   int x;
 732
 733   /* These pointers point to where we are getting our pixel data (inside mpi) and where we are storing it (inside dmpi). */
 734   const unsigned char * source_line;
 735   unsigned char * destination_line;
 736
 737   if (!is_image_direct)
 738     memcpy_pic(destination, source, width, height, destination_stride, source_stride);
 739
 740   for (y = logo_start_y; y <= logo_end_y; y++)
 741   {
 742     source_line = (const unsigned char *) source + (source_stride * y);
 743     destination_line = (unsigned char *) destination + (destination_stride * y);
 744
 745     for (x = logo_start_x; x <= logo_end_x; x++)
 746     {
 747       unsigned int output;
 748
 749       if (filter->pixel[(y * filter->width) + x]) /* Only process if we are in the logo. */
 750       {
 751         get_blur(vf, &output, filter, source_image, x, y, plane);
 752         destination_line[x] = output;
 753       }
 754       else /* Else just copy the data. */
 755         if (!is_image_direct)
 756           destination_line[x] = source_line[x];
 757     }
 758   }
 759 }
 760
 761 /**
 762  * \brief Process a frame.
 763  *
 764  * \param mpi The image sent to use by the previous filter.
 765  * \param dmpi Where we will store the processed output image.
 766  * \param vf This is how the filter gets access to it's persistant data.
 767  *
 768  * \return The return code of the next filter, or 0 on failure/error.
 769  *
 770  * This function processes an entire frame. The frame is sent by the previous
 771  * filter, has the logo removed by the filter, and is then sent to the next
 772  * filter.
 773  */
 774 static int put_image(struct vf_instance_s* vf, mp_image_t *mpi, double pts){
 775     mp_image_t *dmpi;
 776
 777     dmpi=vf_get_image(vf->next,((vf_priv_s *)vf->priv)->fmt,
 778         MP_IMGTYPE_TEMP, MP_IMGFLAG_ACCEPT_STRIDE,
 779         mpi->w, mpi->h);
 780
 781     /* Check to make sure that the filter image and the video stream are the same size. */
 782     if ((((vf_priv_s *)vf->priv)->filter->width != mpi->w) || (((vf_priv_s *)vf->priv)->filter->height != mpi->h))
 783     {
 784       mp_msg(MSGT_VFILTER,MSGL_ERR, "Filter image and video stream are not of the same size. (Filter: %d x %d, Stream: %d x %d)\n",
 785              ((vf_priv_s *)vf->priv)->filter->width, ((vf_priv_s *)vf->priv)->filter->height, mpi->w, mpi->h);
 786       return 0;
 787     }
 788
 789     switch(dmpi->imgfmt){
 790     case IMGFMT_YV12:
 791           convert_yv12(vf, mpi->planes[0],  mpi->stride[0], mpi, mpi->w, mpi->h,
 792                           dmpi->planes[0], dmpi->stride[0],
 793                           mpi->flags & MP_IMGFLAG_DIRECT, ((vf_priv_s *)vf->priv)->filter, 0,
 794                           ((vf_priv_s *)vf->priv)->bounding_rectangle_posx1, ((vf_priv_s *)vf->priv)->bounding_rectangle_posy1,
 795                           ((vf_priv_s *)vf->priv)->bounding_rectangle_posx2, ((vf_priv_s *)vf->priv)->bounding_rectangle_posy2);
 796           convert_yv12(vf, mpi->planes[1],  mpi->stride[1], mpi, mpi->w / 2, mpi->h / 2,
 797                           dmpi->planes[1], dmpi->stride[1],
 798                           mpi->flags & MP_IMGFLAG_DIRECT, ((vf_priv_s *)vf->priv)->half_size_filter, 1,
 799                           ((vf_priv_s *)vf->priv)->bounding_rectangle_half_size_posx1, ((vf_priv_s *)vf->priv)->bounding_rectangle_half_size_posy1,
 800                           ((vf_priv_s *)vf->priv)->bounding_rectangle_half_size_posx2, ((vf_priv_s *)vf->priv)->bounding_rectangle_half_size_posy2);
 801           convert_yv12(vf, mpi->planes[2],  mpi->stride[2], mpi, mpi->w / 2, mpi->h / 2,
 802                           dmpi->planes[2], dmpi->stride[2],
 803                           mpi->flags & MP_IMGFLAG_DIRECT, ((vf_priv_s *)vf->priv)->half_size_filter, 2,
 804                           ((vf_priv_s *)vf->priv)->bounding_rectangle_half_size_posx1, ((vf_priv_s *)vf->priv)->bounding_rectangle_half_size_posy1,
 805                           ((vf_priv_s *)vf->priv)->bounding_rectangle_half_size_posx2, ((vf_priv_s *)vf->priv)->bounding_rectangle_half_size_posy2);
 806           break;
 807
 808     default:
 809         mp_msg(MSGT_VFILTER,MSGL_ERR,"Unhandled format: 0x%X\n",dmpi->imgfmt);
 810         return 0;
 811     }
 812
 813     return vf_next_put_image(vf,dmpi, pts);
 814 }
 815
 816 //===========================================================================//
 817
 818 /**
 819  * \brief Checks to see if the next filter accepts YV12 images.
 820  */
 821 static int query_format(struct vf_instance_s * vf, unsigned int fmt)
 822 {
 823   if (fmt == IMGFMT_YV12)
 824     return vf->next->query_format(vf->next, IMGFMT_YV12);
 825   else
 826     return 0;
 827 }
 828
 829 /**
 830  * \brief Initializes our filter.
 831  *
 832  * \param args The arguments passed in from the command line go here. This
 833  *             filter expects only a single argument telling it where the PGM
 834  *             or PPM file that describes the logo region is.
 835  *
 836  * This sets up our instance variables and parses the arguments to the filter.
 837  */
 838 static int open(vf_instance_t * vf, char * args)
 839 {
 840   vf->priv = safe_malloc(sizeof(vf_priv_s));
 841
 842   /* Load our filter image. */
 843   if (args)
 844     ((vf_priv_s *)vf->priv)->filter = load_pgm(args);
 845   else
 846   {
 847     mp_msg(MSGT_VFILTER, MSGL_ERR, "[vf]remove_logo usage: remove_logo=/path/to/filter_image_file.pgm\n");
 848     free(vf->priv);
 849     return 0;
 850   }
 851
 852   if (((vf_priv_s *)vf->priv)->filter == NULL)
 853   {
 854     /* Error message was displayed by load_pgm(). */
 855     free(vf->priv);
 856     return 0;
 857   }
 858
 859   /* Create the scaled down filter image for the chroma planes. */
 860   convert_mask_to_strength_mask(vf, ((vf_priv_s *)vf->priv)->filter);
 861   ((vf_priv_s *)vf->priv)->half_size_filter = generate_half_size_image(vf, ((vf_priv_s *)vf->priv)->filter);
 862
 863   /* Now that we know how many masks we need (the info is in vf), we can generate the masks. */
 864   initialize_masks(vf);
 865
 866   /* Calculate our bounding rectangles, which determine in what region the logo resides for faster processing. */
 867   calculate_bounding_rectangle(&((vf_priv_s *)vf->priv)->bounding_rectangle_posx1, &((vf_priv_s *)vf->priv)->bounding_rectangle_posy1,
 868                                &((vf_priv_s *)vf->priv)->bounding_rectangle_posx2, &((vf_priv_s *)vf->priv)->bounding_rectangle_posy2,
 869                                 ((vf_priv_s *)vf->priv)->filter);
 870   calculate_bounding_rectangle(&((vf_priv_s *)vf->priv)->bounding_rectangle_half_size_posx1,
 871                                &((vf_priv_s *)vf->priv)->bounding_rectangle_half_size_posy1,
 872                                &((vf_priv_s *)vf->priv)->bounding_rectangle_half_size_posx2,
 873                                &((vf_priv_s *)vf->priv)->bounding_rectangle_half_size_posy2,
 874                                 ((vf_priv_s *)vf->priv)->half_size_filter);
 875
 876   vf->config=config;
 877   vf->put_image=put_image;
 878   vf->query_format=query_format;
 879   return 1;
 880 }
 881
 882 /**
 883  * \brief Frees memory that our filter allocated.
 884  *
 885  * This is called at exit-time.
 886  */
 887 void uninit(vf_instance_t * vf)
 888 {
 889   /* Destroy our masks and images. */
 890   destroy_pgm(((vf_priv_s *)vf->priv)->filter);
 891   destroy_pgm(((vf_priv_s *)vf->priv)->half_size_filter);
 892   destroy_masks(vf);
 893
 894   /* Destroy our private structure that had been used to store those masks and images. */
 895   free(vf->priv);
 896
 897   return;
 898 }
 899
 900 /**
 901  * \brief Meta data about our filter.
 902  */
 903 vf_info_t vf_info_remove_logo = {
 904     "Removes a tv logo based on a mask image.",
 905     "remove-logo",
 906     "Robert Edele",
 907     "",
 908     open,
 909     NULL
 910 };
 911
 912 //===========================================================================//