libvips/libvips/convolution/canny.c

515 lines
12 KiB
C

/* Canny edge detector
*/
/*
This file is part of VIPS.
VIPS is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
02110-1301 USA
*/
/*
These files are distributed with VIPS - http://www.vips.ecs.soton.ac.uk
*/
/*
#define DEBUG
*/
#ifdef HAVE_CONFIG_H
#include <config.h>
#endif /*HAVE_CONFIG_H*/
#include <glib/gi18n-lib.h>
#include <stdio.h>
#include <stdlib.h>
#include <math.h>
#include <vips/vips.h>
typedef struct _VipsCanny {
VipsOperation parent_instance;
VipsImage *in;
VipsImage *out;
double sigma;
VipsPrecision precision;
/* Need an image vector for start_many.
*/
VipsImage *args[3];
} VipsCanny;
typedef VipsOperationClass VipsCannyClass;
G_DEFINE_TYPE( VipsCanny, vips_canny, VIPS_TYPE_OPERATION );
/* Simple 2x2 -1/+1 difference. For uchar, we try to hit the vector path and
* use an offset rather than -ves. Otherwise it's float or double output.
*/
static int
vips_canny_gradient( VipsImage *in, VipsImage **Gx, VipsImage **Gy )
{
VipsImage *scope;
VipsImage **t;
VipsPrecision precision;
scope = vips_image_new();
t = (VipsImage **) vips_object_local_array( (VipsObject *) scope, 2 );
t[0] = vips_image_new_matrixv( 2, 2,
-1.0, 1.0,
-1.0, 1.0 );
if( in->BandFmt == VIPS_FORMAT_UCHAR ) {
precision = VIPS_PRECISION_INTEGER;
vips_image_set_double( t[0], "offset", 128.0 );
}
else
precision = VIPS_PRECISION_FLOAT;
if( vips_conv( in, Gx, t[0], "precision", precision, NULL ) ||
vips_rot90( t[0], &t[1], NULL ) ||
vips_conv( in, Gy, t[1], "precision", precision, NULL ) ) {
g_object_unref( scope );
return( -1 );
}
g_object_unref( scope );
return( 0 );
}
/* LUT for calculating atan2() with +/- 4 bits of precision in each axis.
*/
static VipsPel vips_canny_polar_atan2[256];
/* For the uchar path, gx/gy are -128 to +127, and we need -8 to +7 for the
* atan2 LUT.
*
* For G, we should calculate sqrt( gx * gx + gy * gy ), however we are only
* interested in relative magnitude (max of sqrt), so we can skip the sqrt
* itself. We need a result that will fit in 0 - 255, so shift down.
*/
#define POLAR_UCHAR { \
for( x = 0; x < r->width; x++ ) { \
for( band = 0; band < Gx->Bands; band++ ) { \
int gx = p1[band] - 128; \
int gy = p2[band] - 128; \
\
int i = ((gx >> 4) & 0xf) | (gy & 0xf0); \
\
q[0] = (gx * gx + gy * gy + 256) >> 9; \
q[1] = vips_canny_polar_atan2[i]; \
\
q += 2; \
} \
\
p1 += Gx->Bands; \
p2 += Gx->Bands; \
} \
}
/* Float/double path. We keep the same ranges as the uchar path to reduce
* confusion.
*/
#define POLAR( TYPE ) { \
TYPE *tp1 = (TYPE *) p1; \
TYPE *tp2 = (TYPE *) p2; \
TYPE *tq = (TYPE *) q; \
\
for( x = 0; x < r->width; x++ ) { \
for( band = 0; band < Gx->Bands; band++ ) { \
double gx = tp1[band]; \
double gy = tp2[band]; \
double theta = VIPS_DEG( atan2( gx, gy ) ); \
\
tq[0] = (gx * gx + gy * gy + 256.0) / 512.0; \
tq[1] = 256.0 * fmod( theta + 360.0, 360.0 ) / 360.0; \
\
tq += 2; \
} \
\
tp1 += Gx->Bands; \
tp2 += Gx->Bands; \
} \
}
static int
vips_canny_polar_generate( VipsRegion *or,
void *vseq, void *a, void *b, gboolean *stop )
{
VipsRegion **in = (VipsRegion **) vseq;
VipsRect *r = &or->valid;
VipsImage *Gx = in[0]->im;
int x, y, band;
if( vips_reorder_prepare_many( or->im, in, r ) )
return( -1 );
for( y = 0; y < r->height; y++ ) {
VipsPel *p1 = (VipsPel * restrict)
VIPS_REGION_ADDR( in[0], r->left, r->top + y );
VipsPel *p2 = (VipsPel * restrict)
VIPS_REGION_ADDR( in[1], r->left, r->top + y );
VipsPel *q = (VipsPel * restrict)
VIPS_REGION_ADDR( or, r->left, r->top + y );
switch( Gx->BandFmt ) {
case VIPS_FORMAT_UCHAR:
POLAR_UCHAR;
break;
case VIPS_FORMAT_FLOAT:
POLAR( float );
break;
case VIPS_FORMAT_DOUBLE:
POLAR( double );
break;
default:
g_assert( FALSE );
}
}
return( 0 );
}
static void *
vips_atan2_init( void *null )
{
int i;
for( i = 0; i < 256; i++ ) {
/* Use the bottom 4 bits for x, the top 4 for y. The double
* shift does sign extension, assuming 2s complement.
*/
int bits = sizeof( int ) * 8 - 4;
int x = ((i & 0xf) << bits) >> bits;
int y = ((i >> 4) & 0x0f) << bits >> bits;
double theta = VIPS_DEG( atan2( x, y ) ) + 360;
vips_canny_polar_atan2[i] = 256 * theta / 360;
}
return( NULL );
}
/* Calculate G/theta from Gx/Gy. We code theta as 0-256 for 0-360
* and skip the sqrt on G.
*
* For a white disc on a black background, theta is 0 at the top, 64 on the
* left, 128 on the right and 192 on the right edge.
*/
static int
vips_canny_polar( VipsImage **args, VipsImage **out )
{
static GOnce once = G_ONCE_INIT;
g_once( &once, vips_atan2_init, NULL );
*out = vips_image_new();
if( vips_image_pipeline_array( *out,
VIPS_DEMAND_STYLE_THINSTRIP, args ) )
return( -1 );
(*out)->Bands *= 2;
if( vips_image_generate( *out,
vips_start_many, vips_canny_polar_generate, vips_stop_many,
args, NULL ) )
return( -1 );
return( 0 );
}
#define THIN( TYPE ) { \
TYPE *tp = (TYPE *) p; \
TYPE *tq = (TYPE *) q; \
\
for( x = 0; x < r->width; x++ ) { \
for( band = 0; band < out_bands; band++ ) { \
TYPE G = tp[lsk + psk]; \
TYPE theta = tp[lsk + psk + 1]; \
int low_theta = ((int) (theta / 32)) & 0x7; \
int high_theta = (low_theta + 1) & 0x7; \
TYPE residual = theta - low_theta * 32; \
TYPE lowa = tp[offset[low_theta]]; \
TYPE lowb = tp[offset[high_theta]]; \
TYPE low = (lowa * (32 - residual) + \
lowb * residual) / 32; \
TYPE higha = tp[offset[(low_theta + 4) & 0x7]]; \
TYPE highb = tp[offset[(high_theta + 4) & 0x7]]; \
TYPE high = (higha * (32 - residual) + \
highb * residual) / 32; \
\
if( G <= low || \
G < high ) \
G = 0; \
\
tq[band] = G; \
\
tp += 2; \
} \
\
tq += out_bands; \
} \
}
static int
vips_canny_thin_generate( VipsRegion *or,
void *vseq, void *a, void *b, gboolean *stop )
{
VipsRegion *in = (VipsRegion *) vseq;
VipsRect *r = &or->valid;
VipsImage *im = in->im;
int out_bands = or->im->Bands;
VipsRect rect;
int x, y, band;
int lsk;
int psk;
int offset[8];
rect = *r;
rect.width += 2;
rect.height += 2;
if( vips_region_prepare( in, &rect ) )
return( -1 );
/* These are in typed units.
*/
lsk = VIPS_REGION_LSKIP( in ) / VIPS_IMAGE_SIZEOF_ELEMENT( im );
psk = VIPS_IMAGE_SIZEOF_PEL( im ) / VIPS_IMAGE_SIZEOF_ELEMENT( im );
/* For each of the 8 directions, the offset to get to that pixel from
* the top-left of the 3x3.
*
* 1 | 0 | 7
* --+---+--
* 2 | X | 6
* --+---+--
* 3 | 4 | 5
*/
offset[0] = psk;
offset[1] = 0;
offset[2] = lsk;
offset[3] = 2 * lsk;
offset[4] = 2 * lsk + psk;
offset[5] = 2 * lsk + 2 * psk;
offset[6] = lsk + 2 * psk;
offset[7] = 2 * psk;
for( y = 0; y < r->height; y++ ) {
VipsPel *p = (VipsPel * restrict)
VIPS_REGION_ADDR( in, r->left, r->top + y );
VipsPel *q = (VipsPel * restrict)
VIPS_REGION_ADDR( or, r->left, r->top + y );
switch( im->BandFmt ) {
case VIPS_FORMAT_UCHAR:
THIN( unsigned char );
break;
case VIPS_FORMAT_FLOAT:
THIN( float );
break;
case VIPS_FORMAT_DOUBLE:
THIN( double );
break;
default:
g_assert( FALSE );
}
}
return( 0 );
}
/* Remove non-maximal edges. At each point, compare the G to the G in either
* direction and 0 it if it's not the largest.
*/
static int
vips_canny_thin( VipsImage *in, VipsImage **out )
{
*out = vips_image_new();
if( vips_image_pipelinev( *out,
VIPS_DEMAND_STYLE_THINSTRIP, in, NULL ) )
return( -1 );
(*out)->Bands /= 2;
(*out)->Xsize -= 2;
(*out)->Ysize -= 2;
if( vips_image_generate( *out,
vips_start_one, vips_canny_thin_generate, vips_stop_one,
in, NULL ) )
return( -1 );
return( 0 );
}
static int
vips_canny_build( VipsObject *object )
{
VipsCanny *canny = (VipsCanny *) object;
VipsImage **t = (VipsImage **) vips_object_local_array( object, 6 );
VipsImage *in;
if( VIPS_OBJECT_CLASS( vips_canny_parent_class )->build( object ) )
return( -1 );
in = canny->in;
if( vips_gaussblur( in, &t[0], canny->sigma,
"precision", canny->precision,
NULL ) )
return( -1 );
in = t[0];
if( vips_canny_gradient( in, &t[1], &t[2] ) )
return( -1 );
/* Form (G, theta).
*/
canny->args[0] = t[1];
canny->args[1] = t[2];
canny->args[2] = NULL;
if( vips_canny_polar( canny->args, &t[3] ) )
return( -1 );
in = t[3];
/* Expand by two pixels all around, then thin in the direction of the
* gradient.
*/
if( vips_embed( in, &t[4], 1, 1, in->Xsize + 2, in->Ysize + 2,
"extend", VIPS_EXTEND_COPY,
NULL ) )
return( -1 );
if( vips_canny_thin( t[4], &t[5] ) )
return( -1 );
in = t[5];
g_object_set( object, "out", vips_image_new(), NULL );
if( vips_image_write( in, canny->out ) )
return( -1 );
return( 0 );
}
static void
vips_canny_class_init( VipsCannyClass *class )
{
GObjectClass *gobject_class = G_OBJECT_CLASS( class );
VipsObjectClass *object_class = (VipsObjectClass *) class;
VipsOperationClass *operation_class = VIPS_OPERATION_CLASS( class );
gobject_class->set_property = vips_object_set_property;
gobject_class->get_property = vips_object_get_property;
object_class->nickname = "canny";
object_class->description = _( "Canny edge detector" );
object_class->build = vips_canny_build;
operation_class->flags = VIPS_OPERATION_SEQUENTIAL;
VIPS_ARG_IMAGE( class, "in", 1,
_( "Input" ),
_( "Input image" ),
VIPS_ARGUMENT_REQUIRED_INPUT,
G_STRUCT_OFFSET( VipsCanny, in ) );
VIPS_ARG_IMAGE( class, "out", 2,
_( "Output" ),
_( "Output image" ),
VIPS_ARGUMENT_REQUIRED_OUTPUT,
G_STRUCT_OFFSET( VipsCanny, out ) );
VIPS_ARG_DOUBLE( class, "sigma", 10,
_( "Sigma" ),
_( "Sigma of Gaussian" ),
VIPS_ARGUMENT_OPTIONAL_INPUT,
G_STRUCT_OFFSET( VipsCanny, sigma ),
0.01, 1000, 1.4 );
VIPS_ARG_ENUM( class, "precision", 103,
_( "Precision" ),
_( "Convolve with this precision" ),
VIPS_ARGUMENT_OPTIONAL_INPUT,
G_STRUCT_OFFSET( VipsCanny, precision ),
VIPS_TYPE_PRECISION, VIPS_PRECISION_FLOAT );
}
static void
vips_canny_init( VipsCanny *canny )
{
canny->sigma = 1.4;
canny->precision = VIPS_PRECISION_FLOAT;
}
/**
* vips_canny: (method)
* @in: input image
* @out: (out): output image
* @...: %NULL-terminated list of optional named arguments
*
* Optional arguments:
*
* * @sigma: %gdouble, sigma for gaussian blur
* * @precision: #VipsPrecision, calculation accuracy
*
* Find edges by Canny's method: The maximum of the derivative of the gradient
* in the direction of the gradient. Output is float, except for uchar input,
* where output is uchar, and double input, where output is double. Non-complex
* images only.
*
* Use @sigma to control the scale over which gradient is measured. 1.4 is
* usually a good value.
*
* Use @precision to set the precision of edge detection. For uchar images,
* setting this to #VIPS_PRECISION_INTEGER will make edge detection much
* faster, but sacrifice some sensitivity.
*
* You will probably need to process the output further to eliminate weak
* edges.
*
* See also: vips_sobel().
*
* Returns: 0 on success, -1 on error.
*/
int
vips_canny( VipsImage *in, VipsImage **out, ... )
{
va_list ap;
int result;
va_start( ap, out );
result = vips_call_split( "canny", ap, in, out );
va_end( ap );
return( result );
}