libmpcodecs/vf_remove_logo.c

   1 /*
   2  * This filter loads a .pgm mask file showing where a logo is and uses
   3  * a blur transform to remove the logo.
   4  *
   5  * Copyright (C) 2005 Robert Edele <yartrebo@earthlink.net>
   6  *
   7  * This file is part of MPlayer.
   8  *
   9  * MPlayer is free software; you can redistribute it and/or modify
  10  * it under the terms of the GNU General Public License as published by
  11  * the Free Software Foundation; either version 2 of the License, or
  12  * (at your option) any later version.
  13  *
  14  * MPlayer is distributed in the hope that it will be useful,
  15  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  16  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  17  * GNU General Public License for more details.
  18  *
  19  * You should have received a copy of the GNU General Public License along
  20  * with MPlayer; if not, write to the Free Software Foundation, Inc.,
  21  * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
  22  */
  23
  24 /**
  25  * \file vf_remove_logo.c
  26  *
  27  * \brief Advanced blur-based logo removing filter.
  28
  29  *     Hello and welcome. This code implements a filter to remove annoying TV
  30  * logos and other annoying images placed onto a video stream. It works by filling
  31  * in the pixels that comprise the logo with neighboring pixels. The transform is
  32  * very loosely based on a gaussian blur, but it is different enough to merit its
  33  * own paragraph later on. It is a major improvement on the old delogo filter as
  34  * it both uses a better blurring algorithm and uses a bitmap to use an arbitrary
  35  * and generally much tighter fitting shape than a rectangle.
  36  *
  37  *     The filter requires 1 argument and has no optional arguments. It requires
  38  * a filter bitmap, which must be in PGM or PPM format. A sample invocation would
  39  * be -vf remove_logo=/home/username/logo_bitmaps/xyz.pgm.  Pixels with a value of
  40  * zero are not part of the logo, and non-zero pixels are part of the logo. If you
  41  * use white (255) for the logo and black (0) for the rest, you will be safe. For
  42  * making the filter bitmap, I recommend taking a screen capture of a black frame
  43  * with the logo visible, and then using The GIMP's threshold filter followed by
  44  * the erode filter once or twice. If needed, little splotches can be fixed
  45  * manually. Remember that if logo pixels are not covered, the filter quality will
  46  * be much reduced. Marking too many pixels as part of the logo doesn't hurt as
  47  * much, but it will increase the amount of blurring needed to cover over the
  48  * image and will destroy more information than necessary. Additionally, this blur
  49  * algorithm is O(n^4), where n is the width and height of a hypothetical
  50  * square logo, so extra pixels will slow things down on a large logo.
  51  *
  52  *     The logo removal algorithm has two key points. The first is that it
  53  * distinguishes between pixels in the logo and those not in the logo by using the
  54  * passed-in bitmap. Pixels not in the logo are copied over directly without being
  55  * modified and they also serve as source pixels for the logo fill-in. Pixels
  56  * inside the logo have the mask applied.
  57  *
  58  *     At init-time the bitmap is reprocessed internally, and the distance to the
  59  * nearest edge of the logo (Manhattan distance), along with a little extra to
  60  * remove rough edges, is stored in each pixel. This is done using an in-place
  61  * erosion algorithm, and incrementing each pixel that survives any given erosion.
  62  * Once every pixel is eroded, the maximum value is recorded, and a set of masks
  63  * from size 0 to this size are generated. The masks are circular binary masks,
  64  * where each pixel within a radius N (where N is the size of the mask) is a 1,
  65  * and all other pixels are a 0. Although a gaussian mask would be more
  66  * mathematically accurate, a binary mask works better in practice because we
  67  * generally do not use the central pixels in the mask (because they are in the
  68  * logo region), and thus a gaussian mask will cause too little blur and thus a
  69  * very unstable image.
  70  *
  71  *     The mask is applied in a special way. Namely, only pixels in the mask that
  72  * line up to pixels outside the logo are used. The dynamic mask size means that
  73  * the mask is just big enough so that the edges touch pixels outside the logo, so
  74  * the blurring is kept to a minimum and at least the first boundary condition is
  75  * met (that the image function itself is continuous), even if the second boundary
  76  * condition (that the derivative of the image function is continuous) is not met.
  77  * A masking algorithm that does preserve the second boundary condition
  78  * (perhaps something based on a highly-modified bi-cubic algorithm) should offer
  79  * even better results on paper, but the noise in a typical TV signal should make
  80  * anything based on derivatives hopelessly noisy.
  81  */
  82
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <ctype.h>
#include <inttypes.h>
#include <limits.h>

#include "osdep/io.h"

#include "config.h"
#include "mp_msg.h"
#include "libvo/fastmemcpy.h"

#include "img_format.h"
#include "mp_image.h"
#include "vf.h"
  98
  99 //===========================================================================//
 100
 101 /** \brief Returns the larger of the two arguments. **/
 102 #define max(x,y) ((x)>(y)?(x):(y))
 103 /** \brief Returns the smaller of the two arguments. **/
 104 #define min(x,y) ((x)>(y)?(y):(x))
 105
 106 /**
 107  * \brief Test if a pixel is part of the logo.
 108  */
 109 #define test_filter(image, x, y) ((unsigned char) (image->pixel[((y) * image->width) + (x)]))
 110
 111 /**
 112  * \brief Chooses a slightly larger mask size to improve performance.
 113  *
 114  * This function maps the absolute minimum mask size needed to the mask size we'll
 115  * actually use. f(x) = x (the smallest that will work) will produce the sharpest
 116  * results, but will be quite jittery. f(x) = 1.25x (what I'm using) is a good
 117  * tradeoff in my opinion. This will calculate only at init-time, so you can put a
 118  * long expression here without effecting performance.
 119  */
 120 #define apply_mask_fudge_factor(x) (((x) >> 2) + x)
 121
 122 /**
 123  * \brief Simple implementation of the PGM image format.
 124  *
 125  * This struct holds a bare-bones image loaded from a PGM or PPM file. Once
 126  * loaded and pre-processed, each pixel in this struct will contain how far from
 127  * the edge of the logo each pixel is, using the manhattan distance (|dx| + |dy|).
 128  *
 129  * pixels in char * pixel can be addressed using (y * width) + height.
 130  */
 131 typedef struct
 132 {
 133   unsigned int width;
 134   unsigned int height;
 135
 136   unsigned char * pixel;
 137
 138 } pgm_structure;
 139
 140 /**
 141  * \brief Stores persistant variables.
 142  *
 143  * Variables stored here are kept from frame to frame, and separate instances of
 144  * the filter will get their own separate copies.
 145  */
 146 struct vf_priv_s
 147 {
 148   unsigned int fmt; /* Not exactly sure of the use for this. It came with the example filter I used as a basis for this, and it looks like a lot of stuff will break if I remove it. */
 149   int max_mask_size; /* The largest possible mask size that will be needed with the given filter and corresponding half_size_filter. The half_size_filter can have a larger requirment in some rare (but not degenerate) cases. */
 150   int * * * mask; /* Stores our collection of masks. The first * is for an array of masks, the second for the y axis, and the third for the x axis. */
 151   pgm_structure * filter; /* Stores the full-size filter image. This is used to tell what pixels are in the logo or not in the luma plane. */
 152   pgm_structure * half_size_filter; /* Stores a 50% width and 50% height filter image. This is used to tell what pixels are in the logo or not in the chroma planes. */
 153   /* These 8 variables store the bounding rectangles that the logo resides in. */
 154   int bounding_rectangle_posx1;
 155   int bounding_rectangle_posy1;
 156   int bounding_rectangle_posx2;
 157   int bounding_rectangle_posy2;
 158   int bounding_rectangle_half_size_posx1;
 159   int bounding_rectangle_half_size_posy1;
 160   int bounding_rectangle_half_size_posx2;
 161   int bounding_rectangle_half_size_posy2;
 162 } vf_priv_s;
 163
 164 /**
 165  * \brief Mallocs memory and checks to make sure it succeeded.
 166  *
 167  * \param size How many bytes to allocate.
 168  *
 169  * \return A pointer to the freshly allocated memory block, or NULL on failutre.
 170  *
 171  * Mallocs memory, and checks to make sure it was successfully allocated. Because
 172  * of how MPlayer works, it cannot safely halt execution, but at least the user
 173  * will get an error message before the segfault happens.
 174  */
 175 static void * safe_malloc(int size)
 176 {
 177   void * answer = malloc(size);
 178   if (answer == NULL)
 179     mp_msg(MSGT_VFILTER, MSGL_ERR, "Unable to allocate memory in vf_remove_logo.c\n");
 180
 181   return answer;
 182 }
 183
 184 /**
 185  * \brief Calculates the smallest rectangle that will encompass the logo region.
 186  *
 187  * \param filter This image contains the logo around which the rectangle will
 188  *        will be fitted.
 189  *
 190  * The bounding rectangle is calculated by testing successive lines (from the four
 191  * sides of the rectangle) until no more can be removed without removing logo
 192  * pixels. The results are returned by reference to posx1, posy1, posx2, and
 193  * posy2.
 194  */
 195 static void calculate_bounding_rectangle(int * posx1, int * posy1, int * posx2, int * posy2, pgm_structure * filter)
 196 {
 197   int x; /* Temporary variables to run  */
 198   int y; /* through each row or column. */
 199   int start_x;
 200   int start_y;
 201   int end_x = filter->width - 1;
 202   int end_y = filter->height - 1;
 203   int did_we_find_a_logo_pixel = 0;
 204
 205   /* Let's find the top bound first. */
 206   for (start_x = 0; start_x < filter->width && !did_we_find_a_logo_pixel; start_x++)
 207   {
 208     for (y = 0; y < filter->height; y++)
 209     {
 210       did_we_find_a_logo_pixel |= test_filter(filter, start_x, y);
 211     }
 212   }
 213   start_x--;
 214
 215   /* Now the bottom bound. */
 216   did_we_find_a_logo_pixel = 0;
 217   for (end_x = filter->width - 1; end_x > start_x && !did_we_find_a_logo_pixel; end_x--)
 218   {
 219     for (y = 0; y < filter->height; y++)
 220     {
 221       did_we_find_a_logo_pixel |= test_filter(filter, end_x, y);
 222     }
 223   }
 224   end_x++;
 225
 226   /* Left bound. */
 227   did_we_find_a_logo_pixel = 0;
 228   for (start_y = 0; start_y < filter->height && !did_we_find_a_logo_pixel; start_y++)
 229   {
 230     for (x = 0; x < filter->width; x++)
 231     {
 232       did_we_find_a_logo_pixel |= test_filter(filter, x, start_y);
 233     }
 234   }
 235   start_y--;
 236
 237   /* Right bound. */
 238   did_we_find_a_logo_pixel = 0;
 239   for (end_y = filter->height - 1; end_y > start_y && !did_we_find_a_logo_pixel; end_y--)
 240   {
 241     for (x = 0; x < filter->width; x++)
 242     {
 243       did_we_find_a_logo_pixel |= test_filter(filter, x, end_y);
 244     }
 245   }
 246   end_y++;
 247
 248   *posx1 = start_x;
 249   *posy1 = start_y;
 250   *posx2 = end_x;
 251   *posy2 = end_y;
 252
 253   return;
 254 }
 255
 256 /**
 257  * \brief Free mask memory.
 258  *
 259  * \param vf Data structure which stores our persistant data, and is to be freed.
 260  *
 261  * We call this function when our filter is done. It will free the memory
 262  * allocated to the masks and leave the variables in a safe state.
 263  */
 264 static void destroy_masks(vf_instance_t * vf)
 265 {
 266   int a, b;
 267
 268   /* Load values from the vf->priv struct for faster dereferencing. */
 269   int * * * mask = vf->priv->mask;
 270   int max_mask_size = vf->priv->max_mask_size;
 271
 272   if (mask == NULL)
 273     return; /* Nothing allocated, so return before we segfault. */
 274
 275   /* Free all allocated memory. */
 276   for (a = 0; a <= max_mask_size; a++) /* Loop through each mask. */
 277   {
 278     for (b = -a; b <= a; b++) /* Loop through each scanline in a mask. */
 279     {
 280       free(mask[a][b + a]); /* Free a scanline. */
 281     }
 282     free(mask[a]); /* Free a mask. */
 283   }
 284   free(mask); /* Free the array of pointers pointing to the masks. */
 285
 286   /* Set the pointer to NULL, so that any duplicate calls to this function will not cause a crash. */
 287   vf->priv->mask = NULL;
 288
 289   return;
 290 }
 291
 292 /**
 293  * \brief Set up our array of masks.
 294  *
 295  * \param vf Where our filter stores persistance data, like these masks.
 296  *
 297  * This creates an array of progressively larger masks and calculates their
 298  * values. The values will not change during program execution once this function
 299  * is done.
 300  */
 301 static void initialize_masks(vf_instance_t * vf)
 302 {
 303   int a, b, c;
 304
 305   /* Load values from the vf->priv struct for faster dereferencing. */
 306   int * * * mask = vf->priv->mask;
 307   int max_mask_size = vf->priv->max_mask_size; /* This tells us how many masks we'll need to generate. */
 308
 309   /* Create a circular mask for each size up to max_mask_size. When the filter is applied, the mask size is
 310      determined on a pixel by pixel basis, with pixels nearer the edge of the logo getting smaller mask sizes. */
 311   mask = (int * * *) safe_malloc(sizeof(int * *) * (max_mask_size + 1));
 312   for (a = 0; a <= max_mask_size; a++)
 313   {
 314     mask[a] = (int * *) safe_malloc(sizeof(int *) * ((a * 2) + 1));
 315     for (b = -a; b <= a; b++)
 316     {
 317       mask[a][b + a] = (int *) safe_malloc(sizeof(int) * ((a * 2) + 1));
 318       for (c = -a; c <= a; c++)
 319       {
 320         if ((b * b) + (c * c) <= (a * a)) /* Circular 0/1 mask. */
 321           mask[a][b + a][c + a] = 1;
 322         else
 323           mask[a][b + a][c + a] = 0;
 324       }
 325     }
 326   }
 327
 328   /* Store values back to vf->priv so they aren't lost after the function returns. */
 329   vf->priv->mask = mask;
 330
 331   return;
 332 }
 333
 334 /**
 335  * \brief Pre-processes an image to give distance information.
 336  *
 337  * \param vf Data structure that holds persistant information. All it is used for
 338              in this function is to store the calculated max_mask_size variable.
 339  * \param mask This image will be converted from a greyscale image into a
 340  *             distance image.
 341  *
 342  * This function takes a greyscale image (pgm_structure * mask) and converts it
 343  * in place into a distance image. A distance image is zero for pixels ourside of
 344  * the logo and is the manhattan distance (|dx| + |dy|) for pixels inside of the
 345  * logo. This will overestimate the distance, but that is safe, and is far easier
 346  * to implement than a proper pythagorean distance since I'm using a modified
 347  * erosion algorithm to compute the distances.
 348  */
 349 static void convert_mask_to_strength_mask(vf_instance_t * vf, pgm_structure * mask)
 350 {
 351   int x, y; /* Used by our for loops to go through every single pixel in the picture one at a time. */
 352   int has_anything_changed = 1; /* Used by the main while() loop to know if anything changed on the last erosion. */
 353   int current_pass = 0; /* How many times we've gone through the loop. Used in the in-place erosion algorithm
 354                            and to get us max_mask_size later on. */
 355   int max_mask_size; /* This will record how large a mask the pixel that is the furthest from the edge of the logo
 356                            (and thus the neediest) is. */
 357   char * current_pixel = mask->pixel; /* This stores the actual pixel data. */
 358
 359   /* First pass, set all non-zero values to 1. After this loop finishes, the data should be considered numeric
 360      data for the filter, not color data. */
 361   for (x = 0; x < mask->height * mask->width; x++, current_pixel++)
 362     if(*current_pixel) *current_pixel = 1;
 363
 364   /* Second pass and future passes. For each pass, if a pixel is itself the same value as the current pass,
 365      and its four neighbors are too, then it is incremented. If no pixels are incremented by the end of the pass,
 366      then we go again. Edge pixels are counted as always excluded (this should be true anyway for any sane mask,
 367      but if it isn't this will ensure that we eventually exit). */
 368   while (has_anything_changed)
 369   {
 370     current_pass++;
 371     current_pixel = mask->pixel;
 372
 373     has_anything_changed = 0; /* If this doesn't get set by the end of this pass, then we're done. */
 374
 375     for (y = 1; y < mask->height - 1; y++)
 376     {
 377       for (x = 1; x < mask->width - 1; x++)
 378       {
 379         /* Apply the in-place erosion transform. It is based on the following two premises: 1 - Any pixel that fails 1 erosion
 380            will fail all future erosions. 2 - Only pixels having survived all erosions up to the present will be >= to
 381            current_pass. It doesn't matter if it survived the current pass, failed it, or hasn't been tested yet. */
 382         if (*current_pixel >= current_pass && /* By using >= instead of ==, we allow the algorithm to work in place. */
 383             *(current_pixel + 1) >= current_pass &&
 384             *(current_pixel - 1) >= current_pass &&
 385             *(current_pixel + mask->width) >= current_pass &&
 386             *(current_pixel - mask->width) >= current_pass)
 387          {
 388            (*current_pixel)++; /* Increment the value since it still has not been eroded, as evidenced by the if statement
 389                                   that just evaluated to true. */
 390            has_anything_changed = 1;
 391          }
 392         current_pixel++;
 393       }
 394     }
 395   }
 396
 397   /* Apply the fudge factor, which will increase the size of the mask a little to reduce jitter at the cost of more blur. */
 398   for (y = 1; y < mask->height - 1; y++)
 399   {
 400    for (x = 1; x < mask->width - 1; x++)
 401     {
 402       mask->pixel[(y * mask->width) + x] = apply_mask_fudge_factor(mask->pixel[(y * mask->width) + x]);
 403     }
 404   }
 405
 406   max_mask_size = current_pass + 1; /* As a side-effect, we now know the maximum mask size, which we'll use to generate our masks. */
 407   max_mask_size = apply_mask_fudge_factor(max_mask_size); /* Apply the fudge factor to this number too, since we must
 408                                                              ensure that enough masks are generated. */
 409   vf->priv->max_mask_size = max_mask_size; /* Commit the newly calculated max_mask_size to the vf->priv struct. */
 410
 411   return;
 412 }
 413
 414 /**
 415  * \brief Our blurring function.
 416  *
 417  * \param vf Stores persistant data. In this function we are interested in the
 418  *           array of masks.
 419  * \param value_out The properly blurred and delogoed pixel is outputted here.
 420  * \param logo_mask Tells us which pixels are in the logo and which aren't.
 421  * \param image The image that is having its logo removed.
 422  * \param x x-coordinate of the pixel to blur.
 423  * \param y y-coordinate of the pixel to blur.
 424  * \param plane 0 = luma, 1 = blue chroma, 2 = red chroma (YUV).
 425  *
 426  * This function is the core of the filter. It takes a pixel that is inside the
 427  * logo and blurs it. It does so by finding the average of all the pixels within
 428  * the mask and outside of the logo.
 429  */
 430 static void get_blur(const vf_instance_t * const vf, unsigned int * const value_out, const pgm_structure * const logo_mask,
 431               const mp_image_t * const image, const int x, const int y, const int plane)
 432 {
 433   int mask_size; /* Mask size tells how large a circle to use. The radius is about (slightly larger than) mask size. */
 434   /* Get values from vf->priv for faster dereferencing. */
 435   int * * * mask = vf->priv->mask;
 436
 437   int start_posx, start_posy, end_posx, end_posy;
 438   int i, j;
 439   unsigned int accumulator = 0, divisor = 0;
 440   const unsigned char * mask_read_position; /* What pixel we are reading out of the circular blur mask. */
 441   const unsigned char * logo_mask_read_position; /* What pixel we are reading out of the filter image. */
 442
 443   /* Prepare our bounding rectangle and clip it if need be. */
 444   mask_size = test_filter(logo_mask, x, y);
 445   start_posx = max(0, x - mask_size);
 446   start_posy = max(0, y - mask_size);
 447   end_posx = min(image->width - 1, x + mask_size);
 448   end_posy = min(image->height - 1, y + mask_size);
 449
 450   mask_read_position = image->planes[plane] + (image->stride[plane] * start_posy) + start_posx;
 451   logo_mask_read_position = logo_mask->pixel + (start_posy * logo_mask->width) + start_posx;
 452
 453   for (j = start_posy; j <= end_posy; j++)
 454   {
 455     for (i = start_posx; i <= end_posx; i++)
 456     {
 457       if (!(*logo_mask_read_position) && mask[mask_size][i - start_posx][j - start_posy])
 458       { /* Check to see if this pixel is in the logo or not. Only use the pixel if it is not. */
 459         accumulator += *mask_read_position;
 460         divisor++;
 461       }
 462
 463       mask_read_position++;
 464       logo_mask_read_position++;
 465     }
 466
 467     mask_read_position += (image->stride[plane] - ((end_posx + 1) - start_posx));
 468     logo_mask_read_position += (logo_mask->width - ((end_posx + 1) - start_posx));
 469   }
 470
 471   if (divisor == 0) /* This means that not a single pixel is outside of the logo, so we have no data. */
 472   { /* We should put some eye catching value here, to indicate the flaw to the user. */
 473     *value_out = 255;
 474   }
 475   else /* Else we need to normalise the data using the divisor. */
 476   {
 477     *value_out = (accumulator + (divisor / 2)) / divisor; /* Divide, taking into account average rounding error. */
 478   }
 479
 480   return;
 481 }
 482
 483 /**
 484  * \brief Free a pgm_structure. Undoes load_pgm(...).
 485  */
 486 static void destroy_pgm(pgm_structure * to_be_destroyed)
 487 {
 488   if (to_be_destroyed == NULL)
 489     return; /* Don't do anything if a NULL pointer was passed it. */
 490
 491   /* Internally allocated memory. */
 492   if (to_be_destroyed->pixel != NULL)
 493   {
 494     free(to_be_destroyed->pixel);
 495     to_be_destroyed->pixel = NULL;
 496   }
 497
 498   /* Free the actual struct instance. This is done here and not by the calling function. */
 499   free(to_be_destroyed);
 500 }
 501
 502 /** \brief Helper function for load_pgm(...) to skip whitespace. */
 503 static void load_pgm_skip(FILE *f) {
 504   int c, comment = 0;
 505   do {
 506     c = fgetc(f);
 507     if (c == '#')
 508       comment = 1;
 509     if (c == '\n')
 510       comment = 0;
 511   } while (c != EOF && (isspace(c) || comment));
 512   ungetc(c, f);
 513 }
 514
 515 #define REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE(message) {mp_msg(MSGT_VFILTER, MSGL_ERR, message); return NULL;}
 516
 517 /**
 518  * \brief Loads a raw pgm or ppm file into a newly created pgm_structure object.
 519  *
 520  * \param file_name The name of the file to be loaded. So long as the file is a
 521  *                  valid pgm or ppm file, it will load correctly, even if the
 522  *                  extension is missing or invalid.
 523  *
 524  * \return A pointer to the newly created pgm_structure object. Don't forget to
 525  *         call destroy_pgm(...) when you're done with this. If an error occurs,
 526  *         NULL is returned.
 527  *
 528  * Can load either raw pgm (P5) or raw ppm (P6) image files as a binary image.
 529  * While a pgm file will be loaded normally (greyscale), the only thing that is
 530  * guaranteed with ppm is that all zero (R = 0, G = 0, B = 0) pixels will remain
 531  * zero, and non-zero pixels will remain non-zero.
 532  */
 533 static pgm_structure * load_pgm(const char * file_name)
 534 {
 535   int maximum_greyscale_value;
 536   FILE * input;
 537   int pnm_number;
 538   pgm_structure * new_pgm = (pgm_structure *) safe_malloc (sizeof(pgm_structure));
 539   char * write_position;
 540   char * end_position;
 541   int image_size; /* width * height */
 542
 543   if((input = fopen(file_name, "rb")) == NULL) REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove-logo: Unable to open file. File not found or insufficient permissions.\n");
 544
 545   /* Parse the PGM header. */
 546   if (fgetc(input) != 'P') REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove-logo: File is not a valid PGM or PPM file.\n");
 547   pnm_number = fgetc(input) - '0';
 548   if (pnm_number != 5 && pnm_number != 6) REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove-logo: Invalid PNM file. Only raw PGM (Portable Gray Map) and raw PPM (Portable Pixel Map) subtypes are allowed.\n");
 549   load_pgm_skip(input);
 550   if (fscanf(input, "%i", &(new_pgm->width)) != 1) REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove-logo: Invalid PGM/PPM header.\n");
 551   load_pgm_skip(input);
 552   if (fscanf(input, "%i", &(new_pgm->height)) != 1) REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove-logo: Invalid PGM/PPM header.\n");
 553   load_pgm_skip(input);
 554   if (fscanf(input, "%i", &maximum_greyscale_value) != 1) REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove-logo: Invalid PGM/PPM header.\n");
 555   if (maximum_greyscale_value >= 256) REMOVE_LOGO_LOAD_PGM_ERROR_MESSAGE("[vf]remove_logo: Only 1 byte per pixel (pgm) or 1 byte per color value (ppm) are supported.\n");
 556   load_pgm_skip(input);
 557
 558   new_pgm->pixel = (unsigned char *) safe_malloc (sizeof(unsigned char) * new_pgm->width * new_pgm->height);
 559
 560   /* Load the pixels. */
 561   /* Note: I am aware that fgetc(input) isn't the fastest way of doing things, but it is quite compact and the code only runs once when the filter is initialized.*/
 562   image_size = new_pgm->width * new_pgm->height;
 563   end_position = new_pgm->pixel + image_size;
 564   for (write_position = new_pgm->pixel; write_position < end_position; write_position++)
 565   {
 566     *write_position = fgetc(input);
 567     if (pnm_number == 6) /* This tests to see if the file is a PPM file. */
 568     { /* If it is, then consider the pixel set if any of the three color channels are set. Since we just care about == 0 or != 0, a bitwise or will do the trick. */
 569       *write_position |= fgetc(input);
 570       *write_position |= fgetc(input);
 571     }
 572   }
 573
 574   return new_pgm;
 575 }
 576
 577 /**
 578  * \brief Generates a scaled down image with half width, height, and intensity.
 579  *
 580  * \param vf Our struct for persistant data. In this case, it is used to update
 581  *           mask_max_size with the larger of the old or new value.
 582  * \param input_image The image from which the new half-sized one will be based.
 583  *
 584  * \return The newly allocated and shrunken image.
 585  *
 586  * This function not only scales down an image, but halves the value in each pixel
 587  * too. The purpose of this is to produce a chroma filter image out of a luma
 588  * filter image. The pixel values store the distance to the edge of the logo and
 589  * halving the dimensions halves the distance. This function rounds up, because
 590  * a downwards rounding error could cause the filter to fail, but an upwards
 591  * rounding error will only cause a minor amount of excess blur in the chroma
 592  * planes.
 593  */
 594 static pgm_structure * generate_half_size_image(vf_instance_t * vf, pgm_structure * input_image)
 595 {
 596   int x, y;
 597   pgm_structure * new_pgm = (pgm_structure *) safe_malloc (sizeof(pgm_structure));
 598   int has_anything_changed = 1;
 599   int current_pass;
 600   int max_mask_size;
 601   char * current_pixel;
 602
 603   new_pgm->width = input_image->width / 2;
 604   new_pgm->height = input_image->height / 2;
 605   new_pgm->pixel = (unsigned char *) safe_malloc (sizeof(unsigned char) * new_pgm->width * new_pgm->height);
 606
 607   /* Copy over the image data, using the average of 4 pixels for to calculate each downsampled pixel. */
 608   for (y = 0; y < new_pgm->height; y++)
 609     for (x = 0; x < new_pgm->width; x++)
 610     {
 611       /* Set the pixel if there exists a non-zero value in the source pixels, else clear it. */
 612       new_pgm->pixel[(y * new_pgm->width) + x] = input_image->pixel[((y << 1) * input_image->width) + (x << 1)] ||
 613                                                  input_image->pixel[((y << 1) * input_image->width) + (x << 1) + 1] ||
 614                                                  input_image->pixel[(((y << 1) + 1) * input_image->width) + (x << 1)] ||
 615                                                  input_image->pixel[(((y << 1) + 1) * input_image->width) + (x << 1) + 1];
 616       new_pgm->pixel[(y * new_pgm->width) + x] = min(1, new_pgm->pixel[(y * new_pgm->width) + x]);
 617     }
 618
 619   /* Now we need to recalculate the numbers for the smaller size. Just using the old_value / 2 can cause subtle
 620      and fairly rare, but very nasty, bugs. */
 621
 622   current_pixel = new_pgm->pixel;
 623   /* First pass, set all non-zero values to 1. */
 624   for (x = 0; x < new_pgm->height * new_pgm->width; x++, current_pixel++)
 625     if(*current_pixel) *current_pixel = 1;
 626
 627   /* Second pass and future passes. For each pass, if a pixel is itself the same value as the current pass,
 628      and its four neighbors are too, then it is incremented. If no pixels are incremented by the end of the pass,
 629      then we go again. Edge pixels are counted as always excluded (this should be true anyway for any sane mask,
 630      but if it isn't this will ensure that we eventually exit). */
 631   current_pass = 0;
 632   while (has_anything_changed)
 633   {
 634     current_pass++;
 635
 636     has_anything_changed = 0; /* If this doesn't get set by the end of this pass, then we're done. */
 637
 638     for (y = 1; y < new_pgm->height - 1; y++)
 639     {
 640       for (x = 1; x < new_pgm->width - 1; x++)
 641       {
 642         if (new_pgm->pixel[(y * new_pgm->width) + x] >= current_pass && /* By using >= instead of ==, we allow the algorithm to work in place. */
 643             new_pgm->pixel[(y * new_pgm->width) + (x + 1)] >= current_pass &&
 644             new_pgm->pixel[(y * new_pgm->width) + (x - 1)] >= current_pass &&
 645             new_pgm->pixel[((y + 1) * new_pgm->width) + x] >= current_pass &&
 646             new_pgm->pixel[((y - 1) * new_pgm->width) + x] >= current_pass)
 647          {
 648            new_pgm->pixel[(y * new_pgm->width) + x]++; /* Increment the value since it still has not been eroded,
 649                                                     as evidenced by the if statement that just evaluated to true. */
 650            has_anything_changed = 1;
 651          }
 652       }
 653     }
 654   }
 655
 656   for (y = 1; y < new_pgm->height - 1; y++)
 657   {
 658    for (x = 1; x < new_pgm->width - 1; x++)
 659     {
 660       new_pgm->pixel[(y * new_pgm->width) + x] = apply_mask_fudge_factor(new_pgm->pixel[(y * new_pgm->width) + x]);
 661     }
 662   }
 663
 664   max_mask_size = current_pass + 1; /* As a side-effect, we now know the maximum mask size, which we'll use to generate our masks. */
 665   max_mask_size = apply_mask_fudge_factor(max_mask_size);
 666   /* Commit the newly calculated max_mask_size to the vf->priv struct. */
 667   vf->priv->max_mask_size = max(max_mask_size, vf->priv->max_mask_size);
 668
 669   return new_pgm;
 670 }
 671
 672 /**
 673  * \brief Checks if YV12 is supported by the next filter.
 674  */
 675 static unsigned int find_best(struct vf_instance *vf){
 676   int is_format_okay = vf->next->query_format(vf->next, IMGFMT_YV12);
 677   if ((is_format_okay & VFCAP_CSP_SUPPORTED_BY_HW) || (is_format_okay & VFCAP_CSP_SUPPORTED))
 678     return IMGFMT_YV12;
 679   else
 680     return 0;
 681 }
 682
 683 //===========================================================================//
 684
 685 /**
 686  * \brief Configure the filter and call the next filter's config function.
 687  */
 688 static int config(struct vf_instance *vf, int width, int height, int d_width, int d_height, unsigned int flags, unsigned int outfmt)
 689 {
 690   if(!(vf->priv->fmt=find_best(vf)))
 691     return 0;
 692   else
 693     return vf_next_config(vf,width,height,d_width,d_height,flags,vf->priv->fmt);
 694 }
 695
 696 /**
 697  * \brief Removes the logo from a plane (either luma or chroma).
 698  *
 699  * \param vf Not needed by this function, but needed by the blur function.
 700  * \param source The image to have it's logo removed.
 701  * \param destination Where the output image will be stored.
 702  * \param source_stride How far apart (in memory) two consecutive lines are.
 703  * \param destination Same as source_stride, but for the destination image.
 704  * \param width Width of the image. This is the same for source and destination.
 705  * \param height Height of the image. This is the same for source and destination.
 706  * \param is_image_direct If the image is direct, then source and destination are
 707  *        the same and we can save a lot of time by not copying pixels that
 708  *        haven't changed.
 709  * \param filter The image that stores the distance to the edge of the logo for
 710  *        each pixel.
 711  * \param logo_start_x Smallest x-coordinate that contains at least 1 logo pixel.
 712  * \param logo_start_y Smallest y-coordinate that contains at least 1 logo pixel.
 713  * \param logo_end_x Largest x-coordinate that contains at least 1 logo pixel.
 714  * \param logo_end_y Largest y-coordinate that contains at least 1 logo pixel.
 715  *
 716  * This function processes an entire plane. Pixels outside of the logo are copied
 717  * to the output without change, and pixels inside the logo have the de-blurring
 718  * function applied.
 719  */
 720 static void convert_yv12(const vf_instance_t * const vf, const char * const source, const int source_stride,
 721                          const mp_image_t * const source_image, const int width, const int height,
 722                          char * const destination, const int destination_stride, int is_image_direct, pgm_structure * filter,
 723                          const int plane, const int logo_start_x, const int logo_start_y, const int logo_end_x, const int logo_end_y)
 724 {
 725   int y;
 726   int x;
 727
 728   /* These pointers point to where we are getting our pixel data (inside mpi) and where we are storing it (inside dmpi). */
 729   const unsigned char * source_line;
 730   unsigned char * destination_line;
 731
 732   if (!is_image_direct)
 733     memcpy_pic(destination, source, width, height, destination_stride, source_stride);
 734
 735   for (y = logo_start_y; y <= logo_end_y; y++)
 736   {
 737     source_line = (const unsigned char *) source + (source_stride * y);
 738     destination_line = (unsigned char *) destination + (destination_stride * y);
 739
 740     for (x = logo_start_x; x <= logo_end_x; x++)
 741     {
 742       unsigned int output;
 743
 744       if (filter->pixel[(y * filter->width) + x]) /* Only process if we are in the logo. */
 745       {
 746         get_blur(vf, &output, filter, source_image, x, y, plane);
 747         destination_line[x] = output;
 748       }
 749       else /* Else just copy the data. */
 750         if (!is_image_direct)
 751           destination_line[x] = source_line[x];
 752     }
 753   }
 754 }
 755
 756 /**
 757  * \brief Process a frame.
 758  *
 759  * \param mpi The image sent to use by the previous filter.
 760  * \param dmpi Where we will store the processed output image.
 761  * \param vf This is how the filter gets access to it's persistant data.
 762  *
 763  * \return The return code of the next filter, or 0 on failure/error.
 764  *
 765  * This function processes an entire frame. The frame is sent by the previous
 766  * filter, has the logo removed by the filter, and is then sent to the next
 767  * filter.
 768  */
 769 static int put_image(struct vf_instance *vf, mp_image_t *mpi, double pts){
 770     mp_image_t *dmpi;
 771
 772     dmpi=vf_get_image(vf->next,vf->priv->fmt,
 773         MP_IMGTYPE_TEMP, MP_IMGFLAG_ACCEPT_STRIDE,
 774         mpi->w, mpi->h);
 775
 776     /* Check to make sure that the filter image and the video stream are the same size. */
 777     if (vf->priv->filter->width != mpi->w || vf->priv->filter->height != mpi->h)
 778     {
 779       mp_msg(MSGT_VFILTER,MSGL_ERR, "Filter image and video stream are not of the same size. (Filter: %d x %d, Stream: %d x %d)\n",
 780              vf->priv->filter->width, vf->priv->filter->height, mpi->w, mpi->h);
 781       return 0;
 782     }
 783
 784     switch(dmpi->imgfmt){
 785     case IMGFMT_YV12:
 786           convert_yv12(vf, mpi->planes[0],  mpi->stride[0], mpi, mpi->w, mpi->h,
 787                           dmpi->planes[0], dmpi->stride[0],
 788                           mpi->flags & MP_IMGFLAG_DIRECT, vf->priv->filter, 0,
 789                           vf->priv->bounding_rectangle_posx1, vf->priv->bounding_rectangle_posy1,
 790                           vf->priv->bounding_rectangle_posx2, vf->priv->bounding_rectangle_posy2);
 791           convert_yv12(vf, mpi->planes[1],  mpi->stride[1], mpi, mpi->w / 2, mpi->h / 2,
 792                           dmpi->planes[1], dmpi->stride[1],
 793                           mpi->flags & MP_IMGFLAG_DIRECT, vf->priv->half_size_filter, 1,
 794                           vf->priv->bounding_rectangle_half_size_posx1, vf->priv->bounding_rectangle_half_size_posy1,
 795                           vf->priv->bounding_rectangle_half_size_posx2, vf->priv->bounding_rectangle_half_size_posy2);
 796           convert_yv12(vf, mpi->planes[2],  mpi->stride[2], mpi, mpi->w / 2, mpi->h / 2,
 797                           dmpi->planes[2], dmpi->stride[2],
 798                           mpi->flags & MP_IMGFLAG_DIRECT, vf->priv->half_size_filter, 2,
 799                           vf->priv->bounding_rectangle_half_size_posx1, vf->priv->bounding_rectangle_half_size_posy1,
 800                           vf->priv->bounding_rectangle_half_size_posx2, vf->priv->bounding_rectangle_half_size_posy2);
 801           break;
 802
 803     default:
 804         mp_msg(MSGT_VFILTER,MSGL_ERR,"Unhandled format: 0x%X\n",dmpi->imgfmt);
 805         return 0;
 806     }
 807
 808     return vf_next_put_image(vf,dmpi, pts);
 809 }
 810
 811 //===========================================================================//
 812
 813 /**
 814  * \brief Checks to see if the next filter accepts YV12 images.
 815  */
 816 static int query_format(struct vf_instance *vf, unsigned int fmt)
 817 {
 818   if (fmt == IMGFMT_YV12)
 819     return vf->next->query_format(vf->next, IMGFMT_YV12);
 820   else
 821     return 0;
 822 }
 823
 824 /**
 825  * \brief Frees memory that our filter allocated.
 826  *
 827  * This is called at exit-time.
 828  */
 829 static void uninit(vf_instance_t *vf)
 830 {
 831   /* Destroy our masks and images. */
 832   destroy_pgm(vf->priv->filter);
 833   destroy_pgm(vf->priv->half_size_filter);
 834   destroy_masks(vf);
 835
 836   /* Destroy our private structure that had been used to store those masks and images. */
 837   free(vf->priv);
 838
 839   return;
 840 }
 841
 842 /**
 843  * \brief Initializes our filter.
 844  *
 845  * \param args The arguments passed in from the command line go here. This
 846  *             filter expects only a single argument telling it where the PGM
 847  *             or PPM file that describes the logo region is.
 848  *
 849  * This sets up our instance variables and parses the arguments to the filter.
 850  */
 851 static int vf_open(vf_instance_t *vf, char *args)
 852 {
 853   vf->priv = safe_malloc(sizeof(vf_priv_s));
 854   vf->uninit = uninit;
 855
 856   /* Load our filter image. */
 857   if (args)
 858     vf->priv->filter = load_pgm(args);
 859   else
 860   {
 861     mp_msg(MSGT_VFILTER, MSGL_ERR, "[vf]remove_logo usage: remove_logo=/path/to/filter_image_file.pgm\n");
 862     free(vf->priv);
 863     return 0;
 864   }
 865
 866   if (vf->priv->filter == NULL)
 867   {
 868     /* Error message was displayed by load_pgm(). */
 869     free(vf->priv);
 870     return 0;
 871   }
 872
 873   /* Create the scaled down filter image for the chroma planes. */
 874   convert_mask_to_strength_mask(vf, vf->priv->filter);
 875   vf->priv->half_size_filter = generate_half_size_image(vf, vf->priv->filter);
 876
 877   /* Now that we know how many masks we need (the info is in vf), we can generate the masks. */
 878   initialize_masks(vf);
 879
 880   /* Calculate our bounding rectangles, which determine in what region the logo resides for faster processing. */
 881   calculate_bounding_rectangle(&vf->priv->bounding_rectangle_posx1, &vf->priv->bounding_rectangle_posy1,
 882                                &vf->priv->bounding_rectangle_posx2, &vf->priv->bounding_rectangle_posy2,
 883                                 vf->priv->filter);
 884   calculate_bounding_rectangle(&vf->priv->bounding_rectangle_half_size_posx1,
 885                                &vf->priv->bounding_rectangle_half_size_posy1,
 886                                &vf->priv->bounding_rectangle_half_size_posx2,
 887                                &vf->priv->bounding_rectangle_half_size_posy2,
 888                                 vf->priv->half_size_filter);
 889
 890   vf->config=config;
 891   vf->put_image=put_image;
 892   vf->query_format=query_format;
 893   return 1;
 894 }
 895
/**
 * \brief Meta data about our filter.
 *
 * The initializers are positional. The field meanings noted below are
 * inferred from the values only; confirm them against the vf_info_t
 * declaration.
 */
const vf_info_t vf_info_remove_logo = {
    "Removes a tv logo based on a mask image.", /* presumably the human-readable description */
    "remove-logo",  /* presumably the filter name. NOTE(review): the usage message in vf_open() spells it "remove_logo" - confirm which is intended. */
    "Robert Edele", /* presumably the author; matches the copyright holder of this file */
    "",             /* left empty; purpose not visible from here */
    vf_open,        /* the initialization function defined above */
    NULL            /* unused by this filter; purpose not visible from here */
};
 907
 908 //===========================================================================//