remove old fftw2 path, reduce mem use
This commit is contained in:
parent
bf10ec7432
commit
d621cd1f38
@ -69,7 +69,8 @@
|
|||||||
- new Python binding based on gobject-introspection
|
- new Python binding based on gobject-introspection
|
||||||
- only spot options at the end of arg strings
|
- only spot options at the end of arg strings
|
||||||
- add vips_cache() as a vips8 operator
|
- add vips_cache() as a vips8 operator
|
||||||
- remove the old fft fallbacks
|
- remove the old fft fallback
|
||||||
|
- remove fftw2 support
|
||||||
|
|
||||||
14/1/12 started 7.26.8
|
14/1/12 started 7.26.8
|
||||||
- interpolate CLI args were broken (thanks speckins)
|
- interpolate CLI args were broken (thanks speckins)
|
||||||
|
4
TODO
4
TODO
@ -1,5 +1,9 @@
|
|||||||
- add a fft test to the suite
|
- add a fft test to the suite
|
||||||
|
|
||||||
|
can we get fft memuse down? nip2 cache fills mem very quickly when painting
|
||||||
|
on an fft since it tries to keep the last 10,000 images :( the new vips
|
||||||
|
cache should be much better, of course
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
24
configure.in
24
configure.in
@ -331,18 +331,16 @@ GTK_DOC_CHECK(1.9)
|
|||||||
|
|
||||||
# optional supporting libraries
|
# optional supporting libraries
|
||||||
|
|
||||||
# we can wrap fftw3 and fftw2 ... but just look for fftw3, since we can do
|
AC_ARG_WITH([fftw],
|
||||||
# that with pkg-config
|
AS_HELP_STRING([--without-fftw], [build without fftw (default: test)]))
|
||||||
AC_ARG_WITH([fftw3],
|
|
||||||
AS_HELP_STRING([--without-fftw3], [build without fftw3 (default: test)]))
|
|
||||||
|
|
||||||
if test x"$with_fftw3" != "xno"; then
|
if test x"$with_fftw" != "xno"; then
|
||||||
PKG_CHECK_MODULES(FFTW3, fftw3,
|
PKG_CHECK_MODULES(FFTW, fftw3,
|
||||||
[AC_DEFINE(HAVE_FFTW3,1,[define if you have fftw3 installed.])
|
[AC_DEFINE(HAVE_FFTW,1,[define if you have fftw3 installed.])
|
||||||
with_fftw3=yes
|
with_fftw=yes
|
||||||
PACKAGES_USED="$PACKAGES_USED fftw3"],
|
PACKAGES_USED="$PACKAGES_USED fftw3"],
|
||||||
[AC_MSG_WARN([fftw3 not found; disabling fftw support])
|
[AC_MSG_WARN([fftw not found; disabling fftw support])
|
||||||
with_fftw3=no])
|
with_fftw=no])
|
||||||
fi
|
fi
|
||||||
|
|
||||||
# ImageMagick ... detect attribute iteration too
|
# ImageMagick ... detect attribute iteration too
|
||||||
@ -654,14 +652,14 @@ fi
|
|||||||
# Gather all up for VIPS_CFLAGS, VIPS_INCLUDES, VIPS_LIBS and VIPS_CXX_LIBS
|
# Gather all up for VIPS_CFLAGS, VIPS_INCLUDES, VIPS_LIBS and VIPS_CXX_LIBS
|
||||||
# sort includes to get longer, more specific dirs first
|
# sort includes to get longer, more specific dirs first
|
||||||
# helps, for example, selecting graphicsmagick over imagemagick
|
# helps, for example, selecting graphicsmagick over imagemagick
|
||||||
VIPS_CFLAGS=`for i in $VIPS_CFLAGS $GTHREAD_CFLAGS $REQUIRED_CFLAGS $PANGOFT2_CFLAGS $FFTW3_CFLAGS $MAGICK_CFLAGS $PNG_CFLAGS $EXIF_CFLAGS $MATIO_CFLAGS $CFITSIO_CFLAGS $OPENEXR_CFLAGS $OPENSLIDE_CFLAGS $ORC_CFLAGS
|
VIPS_CFLAGS=`for i in $VIPS_CFLAGS $GTHREAD_CFLAGS $REQUIRED_CFLAGS $PANGOFT2_CFLAGS $FFTW_CFLAGS $MAGICK_CFLAGS $PNG_CFLAGS $EXIF_CFLAGS $MATIO_CFLAGS $CFITSIO_CFLAGS $OPENEXR_CFLAGS $OPENSLIDE_CFLAGS $ORC_CFLAGS
|
||||||
do
|
do
|
||||||
echo $i
|
echo $i
|
||||||
done | sort -ru`
|
done | sort -ru`
|
||||||
VIPS_CFLAGS=`echo $VIPS_CFLAGS`
|
VIPS_CFLAGS=`echo $VIPS_CFLAGS`
|
||||||
VIPS_CFLAGS="$VIPS_DEBUG_FLAGS $VIPS_CFLAGS"
|
VIPS_CFLAGS="$VIPS_DEBUG_FLAGS $VIPS_CFLAGS"
|
||||||
VIPS_INCLUDES="$PNG_INCLUDES $TIFF_INCLUDES $ZIP_INCLUDES $JPEG_INCLUDES $FFTW_INCLUDES $LCMS_INCLUDES"
|
VIPS_INCLUDES="$PNG_INCLUDES $TIFF_INCLUDES $ZIP_INCLUDES $JPEG_INCLUDES $FFTW_INCLUDES $LCMS_INCLUDES"
|
||||||
VIPS_LIBS="$MAGICK_LIBS $PNG_LIBS $TIFF_LIBS $ZIP_LIBS $JPEG_LIBS $GTHREAD_LIBS $REQUIRED_LIBS $PANGOFT2_LIBS $FFTW3_LIBS $FFTW_LIBS $ORC_LIBS $LCMS_LIBS $OPENEXR_LIBS $OPENSLIDE_LIBS $CFITSIO_LIBS $MATIO_LIBS $EXIF_LIBS -lm"
|
VIPS_LIBS="$MAGICK_LIBS $PNG_LIBS $TIFF_LIBS $ZIP_LIBS $JPEG_LIBS $GTHREAD_LIBS $REQUIRED_LIBS $PANGOFT2_LIBS $FFTW_LIBS $ORC_LIBS $LCMS_LIBS $OPENEXR_LIBS $OPENSLIDE_LIBS $CFITSIO_LIBS $MATIO_LIBS $EXIF_LIBS -lm"
|
||||||
|
|
||||||
# we need this to generate paths in swig/python/setup.py.in
|
# we need this to generate paths in swig/python/setup.py.in
|
||||||
AC_SUBST(top_srcdir)
|
AC_SUBST(top_srcdir)
|
||||||
@ -731,7 +729,7 @@ build docs with gtkdoc: $enable_gtk_doc
|
|||||||
gobject introspection: $found_introspection
|
gobject introspection: $found_introspection
|
||||||
|
|
||||||
* optional packages and modules
|
* optional packages and modules
|
||||||
use fftw3 for FFT: $with_fftw3
|
use fftw3 for FFT: $with_fftw
|
||||||
Magick package: $with_magickpackage
|
Magick package: $with_magickpackage
|
||||||
file import with libMagick: $with_magick
|
file import with libMagick: $with_magick
|
||||||
accelerate loops with orc: $with_orc
|
accelerate loops with orc: $with_orc
|
||||||
|
@ -72,208 +72,14 @@
|
|||||||
#include <math.h>
|
#include <math.h>
|
||||||
|
|
||||||
#ifdef HAVE_FFTW
|
#ifdef HAVE_FFTW
|
||||||
#include <rfftw.h>
|
|
||||||
#endif /*HAVE_FFTW*/
|
|
||||||
|
|
||||||
#ifdef HAVE_FFTW3
|
|
||||||
#include <fftw3.h>
|
#include <fftw3.h>
|
||||||
#endif /*HAVE_FFTW3*/
|
#endif /*HAVE_FFTW*/
|
||||||
|
|
||||||
#include <vips/vips.h>
|
#include <vips/vips.h>
|
||||||
#include <vips/internal.h>
|
#include <vips/internal.h>
|
||||||
|
|
||||||
#ifdef HAVE_FFTW
|
#ifdef HAVE_FFTW
|
||||||
|
|
||||||
/* Call rfftw for a 1 band real image.
|
|
||||||
*/
|
|
||||||
static int
|
|
||||||
rfwfft1( IMAGE *dummy, IMAGE *in, IMAGE *out )
|
|
||||||
{
|
|
||||||
const guint64 size = VIPS_IMAGE_N_PELS( in );
|
|
||||||
const int half_width = in->Xsize / 2 + 1;
|
|
||||||
|
|
||||||
/* Pack to double real here.
|
|
||||||
*/
|
|
||||||
IMAGE *real = im_open_local( dummy, "fwfft1:1", "t" );
|
|
||||||
|
|
||||||
/* Transform to halfcomplex here.
|
|
||||||
*/
|
|
||||||
double *half_complex = IM_ARRAY( dummy,
|
|
||||||
in->Ysize * half_width * 2, double );
|
|
||||||
|
|
||||||
rfftwnd_plan plan;
|
|
||||||
double *buf, *q, *p;
|
|
||||||
int x, y;
|
|
||||||
|
|
||||||
if( !real || !half_complex || im_pincheck( in ) || im_outcheck( out ) )
|
|
||||||
return( -1 );
|
|
||||||
if( in->Coding != IM_CODING_NONE || in->Bands != 1 ) {
|
|
||||||
im_error( "im_fwfft", _( "one band uncoded only" ) );
|
|
||||||
return( -1 );
|
|
||||||
}
|
|
||||||
if( im_clip2fmt( in, real, IM_BANDFMT_DOUBLE ) )
|
|
||||||
return( -1 );
|
|
||||||
|
|
||||||
/* Make the plan for the transform. Yes, they really do use nx for
|
|
||||||
* height and ny for width.
|
|
||||||
*/
|
|
||||||
if( !(plan = rfftw2d_create_plan( in->Ysize, in->Xsize,
|
|
||||||
FFTW_FORWARD, FFTW_MEASURE | FFTW_USE_WISDOM )) ) {
|
|
||||||
im_error( "im_fwfft", _( "unable to create transform plan" ) );
|
|
||||||
return( -1 );
|
|
||||||
}
|
|
||||||
|
|
||||||
rfftwnd_one_real_to_complex( plan,
|
|
||||||
(fftw_real *) real->data, (fftw_complex *) half_complex );
|
|
||||||
|
|
||||||
rfftwnd_destroy_plan( plan );
|
|
||||||
|
|
||||||
/* WIO to out.
|
|
||||||
*/
|
|
||||||
if( im_cp_desc( out, in ) )
|
|
||||||
return( -1 );
|
|
||||||
out->BandFmt = IM_BANDFMT_DPCOMPLEX;
|
|
||||||
if( im_setupout( out ) )
|
|
||||||
return( -1 );
|
|
||||||
if( !(buf = (double *) IM_ARRAY( dummy,
|
|
||||||
IM_IMAGE_SIZEOF_LINE( out ), VipsPel )) )
|
|
||||||
return( -1 );
|
|
||||||
|
|
||||||
/* Copy to out and normalise. The right half is the up/down and
|
|
||||||
* left/right flip of the left, but conjugated. Do the first
|
|
||||||
* row separately, then mirror around the centre row.
|
|
||||||
*/
|
|
||||||
p = half_complex;
|
|
||||||
q = buf;
|
|
||||||
|
|
||||||
for( x = 0; x < half_width; x++ ) {
|
|
||||||
q[0] = p[0] / size;
|
|
||||||
q[1] = p[1] / size;
|
|
||||||
p += 2;
|
|
||||||
q += 2;
|
|
||||||
}
|
|
||||||
|
|
||||||
p = half_complex + ((in->Xsize + 1) / 2 - 1) * 2;
|
|
||||||
|
|
||||||
for( x = half_width; x < out->Xsize; x++ ) {
|
|
||||||
q[0] = p[0] / size;
|
|
||||||
q[1] = -1.0 * p[1] / size;
|
|
||||||
p -= 2;
|
|
||||||
q += 2;
|
|
||||||
}
|
|
||||||
|
|
||||||
if( im_writeline( 0, out, (VipsPel *) buf ) )
|
|
||||||
return( -1 );
|
|
||||||
|
|
||||||
for( y = 1; y < out->Ysize; y++ ) {
|
|
||||||
p = half_complex + y * half_width * 2;
|
|
||||||
q = buf;
|
|
||||||
|
|
||||||
for( x = 0; x < half_width; x++ ) {
|
|
||||||
q[0] = p[0] / size;
|
|
||||||
q[1] = p[1] / size;
|
|
||||||
p += 2;
|
|
||||||
q += 2;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Good grief.
|
|
||||||
*/
|
|
||||||
p = half_complex + 2 *
|
|
||||||
((out->Ysize - y + 1) * half_width - 2 +
|
|
||||||
(in->Xsize & 1));
|
|
||||||
|
|
||||||
for( x = half_width; x < out->Xsize; x++ ) {
|
|
||||||
q[0] = p[0] / size;
|
|
||||||
q[1] = -1.0 * p[1] / size;
|
|
||||||
p -= 2;
|
|
||||||
q += 2;
|
|
||||||
}
|
|
||||||
|
|
||||||
if( im_writeline( y, out, (VipsPel *) buf ) )
|
|
||||||
return( -1 );
|
|
||||||
}
|
|
||||||
|
|
||||||
return( 0 );
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Call fftw for a 1 band complex image.
|
|
||||||
*/
|
|
||||||
static int
|
|
||||||
cfwfft1( IMAGE *dummy, IMAGE *in, IMAGE *out )
|
|
||||||
{
|
|
||||||
fftwnd_plan plan;
|
|
||||||
double *buf, *q, *p;
|
|
||||||
int x, y;
|
|
||||||
|
|
||||||
IMAGE *cmplx = im_open_local( dummy, "fwfft1:1", "t" );
|
|
||||||
|
|
||||||
/* Make dp complex image.
|
|
||||||
*/
|
|
||||||
if( !cmplx || im_pincheck( in ) || im_outcheck( out ) )
|
|
||||||
return( -1 );
|
|
||||||
if( in->Coding != IM_CODING_NONE || in->Bands != 1 ) {
|
|
||||||
im_error( "im_fwfft", _( "one band uncoded only" ) );
|
|
||||||
return( -1 );
|
|
||||||
}
|
|
||||||
if( im_clip2fmt( in, cmplx, IM_BANDFMT_DPCOMPLEX ) )
|
|
||||||
return( -1 );
|
|
||||||
|
|
||||||
/* Make the plan for the transform.
|
|
||||||
*/
|
|
||||||
if( !(plan = fftw2d_create_plan( in->Ysize, in->Xsize,
|
|
||||||
FFTW_FORWARD,
|
|
||||||
FFTW_MEASURE | FFTW_USE_WISDOM | FFTW_IN_PLACE )) ) {
|
|
||||||
im_error( "im_fwfft", _( "unable to create transform plan" ) );
|
|
||||||
return( -1 );
|
|
||||||
}
|
|
||||||
|
|
||||||
fftwnd_one( plan, (fftw_complex *) cmplx->data, NULL );
|
|
||||||
|
|
||||||
fftwnd_destroy_plan( plan );
|
|
||||||
|
|
||||||
/* WIO to out.
|
|
||||||
*/
|
|
||||||
if( im_cp_desc( out, in ) )
|
|
||||||
return( -1 );
|
|
||||||
out->BandFmt = IM_BANDFMT_DPCOMPLEX;
|
|
||||||
if( im_setupout( out ) )
|
|
||||||
return( -1 );
|
|
||||||
if( !(buf = (double *) IM_ARRAY( dummy,
|
|
||||||
IM_IMAGE_SIZEOF_LINE( out ), VipsPel )) )
|
|
||||||
return( -1 );
|
|
||||||
|
|
||||||
/* Copy to out, normalise.
|
|
||||||
*/
|
|
||||||
for( p = (double *) cmplx->data, y = 0; y < out->Ysize; y++ ) {
|
|
||||||
guint64 size = VIPS_IMAGE_N_PELS( out );
|
|
||||||
|
|
||||||
q = buf;
|
|
||||||
|
|
||||||
for( x = 0; x < out->Xsize; x++ ) {
|
|
||||||
q[0] = p[0] / size;
|
|
||||||
q[1] = p[1] / size;
|
|
||||||
p += 2;
|
|
||||||
q += 2;
|
|
||||||
}
|
|
||||||
|
|
||||||
if( im_writeline( y, out, (VipsPel *) buf ) )
|
|
||||||
return( -1 );
|
|
||||||
}
|
|
||||||
|
|
||||||
return( 0 );
|
|
||||||
}
|
|
||||||
|
|
||||||
static int
|
|
||||||
fwfft1( IMAGE *dummy, IMAGE *in, IMAGE *out )
|
|
||||||
{
|
|
||||||
if( im_iscomplex( in ) )
|
|
||||||
return( cfwfft1( dummy, in, out ) );
|
|
||||||
else
|
|
||||||
return( rfwfft1( dummy, in, out ) );
|
|
||||||
}
|
|
||||||
|
|
||||||
#elif defined HAVE_FFTW3
|
|
||||||
|
|
||||||
/* Real to complex forward transform.
|
/* Real to complex forward transform.
|
||||||
*/
|
*/
|
||||||
static int
|
static int
|
||||||
@ -282,37 +88,34 @@ rfwfft1( IMAGE *dummy, IMAGE *in, IMAGE *out )
|
|||||||
const guint64 size = VIPS_IMAGE_N_PELS( in );
|
const guint64 size = VIPS_IMAGE_N_PELS( in );
|
||||||
const int half_width = in->Xsize / 2 + 1;
|
const int half_width = in->Xsize / 2 + 1;
|
||||||
|
|
||||||
/* Pack to double real here.
|
IMAGE *real;
|
||||||
*/
|
double *half_complex;
|
||||||
IMAGE *real = im_open_local( dummy, "fwfft1:1", "t" );
|
double *planner_scratch;
|
||||||
|
|
||||||
/* Transform to halfcomplex here.
|
|
||||||
*/
|
|
||||||
double *half_complex = IM_ARRAY( dummy,
|
|
||||||
in->Ysize * half_width * 2, double );
|
|
||||||
|
|
||||||
/* We have to have a separate real buffer for the planner to work on.
|
|
||||||
*/
|
|
||||||
double *planner_scratch = IM_ARRAY( dummy,
|
|
||||||
VIPS_IMAGE_N_PELS( in ), double );
|
|
||||||
|
|
||||||
fftw_plan plan;
|
fftw_plan plan;
|
||||||
double *buf, *q, *p;
|
double *buf, *q, *p;
|
||||||
int x, y;
|
int x, y;
|
||||||
|
|
||||||
if( !real || !half_complex || im_pincheck( in ) || im_outcheck( out ) )
|
if( vips_check_mono( "im_fwfft", in ) ||
|
||||||
|
vips_check_uncoded( "im_fwfft", in ) )
|
||||||
return( -1 );
|
return( -1 );
|
||||||
if( in->Coding != IM_CODING_NONE || in->Bands != 1 ) {
|
|
||||||
im_error( "im_fwfft", "%s", _( "one band uncoded only" ) );
|
/* Convert input to a real double membuffer.
|
||||||
return( -1 );
|
*/
|
||||||
}
|
if( !(real = im_open_local( dummy, "fwfft1:1", "t" )) ||
|
||||||
if( im_clip2fmt( in, real, IM_BANDFMT_DOUBLE ) )
|
im_clip2fmt( in, real, IM_BANDFMT_DOUBLE ) )
|
||||||
return( -1 );
|
return( -1 );
|
||||||
|
|
||||||
/* Make the plan for the transform. Yes, they really do use nx for
|
/* Make the plan for the transform. Yes, they really do use nx for
|
||||||
* height and ny for width. Use a separate scratch buffer for the
|
* height and ny for width. Use a separate scratch buffer for the
|
||||||
* planner, we can't overwrite real->data
|
* planner, we can't overwrite real->data
|
||||||
*/
|
*/
|
||||||
|
if( !(planner_scratch = IM_ARRAY( dummy,
|
||||||
|
VIPS_IMAGE_N_PELS( in ), double )) )
|
||||||
|
return( -1 );
|
||||||
|
if( !(half_complex = IM_ARRAY( dummy,
|
||||||
|
in->Ysize * half_width * 2, double )) )
|
||||||
|
return( -1 );
|
||||||
if( !(plan = fftw_plan_dft_r2c_2d( in->Ysize, in->Xsize,
|
if( !(plan = fftw_plan_dft_r2c_2d( in->Ysize, in->Xsize,
|
||||||
planner_scratch, (fftw_complex *) half_complex,
|
planner_scratch, (fftw_complex *) half_complex,
|
||||||
0 )) ) {
|
0 )) ) {
|
||||||
@ -321,6 +124,8 @@ rfwfft1( IMAGE *dummy, IMAGE *in, IMAGE *out )
|
|||||||
return( -1 );
|
return( -1 );
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if( im_incheck( real ) )
|
||||||
|
return( -1 );
|
||||||
fftw_execute_dft_r2c( plan,
|
fftw_execute_dft_r2c( plan,
|
||||||
(double *) real->data, (fftw_complex *) half_complex );
|
(double *) real->data, (fftw_complex *) half_complex );
|
||||||
|
|
||||||
@ -400,27 +205,28 @@ rfwfft1( IMAGE *dummy, IMAGE *in, IMAGE *out )
|
|||||||
static int
|
static int
|
||||||
cfwfft1( IMAGE *dummy, IMAGE *in, IMAGE *out )
|
cfwfft1( IMAGE *dummy, IMAGE *in, IMAGE *out )
|
||||||
{
|
{
|
||||||
|
IMAGE *cmplx;
|
||||||
fftw_plan plan;
|
fftw_plan plan;
|
||||||
|
double *planner_scratch;
|
||||||
double *buf, *q, *p;
|
double *buf, *q, *p;
|
||||||
int x, y;
|
int x, y;
|
||||||
|
|
||||||
IMAGE *cmplx = im_open_local( dummy, "fwfft1:1", "t" );
|
if( vips_check_mono( "im_fwfft", in ) ||
|
||||||
|
vips_check_uncoded( "im_fwfft", in ) )
|
||||||
|
return( -1 );
|
||||||
|
|
||||||
|
if( !(cmplx = im_open_local( dummy, "fwfft1:1", "t" )) ||
|
||||||
|
im_pincheck( in ) ||
|
||||||
|
im_outcheck( out ) )
|
||||||
|
return( -1 );
|
||||||
|
|
||||||
|
if( im_clip2fmt( in, cmplx, IM_BANDFMT_DPCOMPLEX ) )
|
||||||
|
return( -1 );
|
||||||
|
|
||||||
/* We have to have a separate buffer for the planner to work on.
|
/* We have to have a separate buffer for the planner to work on.
|
||||||
*/
|
*/
|
||||||
double *planner_scratch = IM_ARRAY( dummy,
|
if( !(planner_scratch = IM_ARRAY( dummy,
|
||||||
VIPS_IMAGE_N_PELS( in ) * 2, double );
|
VIPS_IMAGE_N_PELS( in ) * 2, double )) )
|
||||||
|
|
||||||
/* Make dp complex image.
|
|
||||||
*/
|
|
||||||
if( !cmplx || im_pincheck( in ) || im_outcheck( out ) )
|
|
||||||
return( -1 );
|
|
||||||
if( in->Coding != IM_CODING_NONE || in->Bands != 1 ) {
|
|
||||||
im_error( "im_fwfft",
|
|
||||||
"%s", _( "one band uncoded only" ) );
|
|
||||||
return( -1 );
|
|
||||||
}
|
|
||||||
if( im_clip2fmt( in, cmplx, IM_BANDFMT_DPCOMPLEX ) )
|
|
||||||
return( -1 );
|
return( -1 );
|
||||||
|
|
||||||
/* Make the plan for the transform.
|
/* Make the plan for the transform.
|
||||||
@ -495,22 +301,39 @@ fwfft1( IMAGE *dummy, IMAGE *in, IMAGE *out )
|
|||||||
#endif
|
#endif
|
||||||
|
|
||||||
/* Transform an n-band image with a 1-band processing function.
|
/* Transform an n-band image with a 1-band processing function.
|
||||||
|
*
|
||||||
|
* Memory strategy: we need memory buffers for the input and the output of
|
||||||
|
* fftw. In some modes fftw generates only half the output and we construct
|
||||||
|
* the rest.
|
||||||
|
*
|
||||||
|
* input pipeline ->
|
||||||
|
* bandsplit ->
|
||||||
|
* full memory image, freed when im_*fft*() exits ->
|
||||||
|
* fftw ->
|
||||||
|
* half memory image, freed when im_*fft*() exits ->
|
||||||
|
* full memory image, freed when @out is freed ->
|
||||||
|
* partial bandjoin ->
|
||||||
|
* output pipeline
|
||||||
|
*
|
||||||
|
* im__fftproc() needs to just call im__fftproc_fn directly for 1 band images,
|
||||||
|
* so we can't cache the output in this fn.
|
||||||
*/
|
*/
|
||||||
int
|
int
|
||||||
im__fftproc( IMAGE *dummy, IMAGE *in, IMAGE *out, im__fftproc_fn fn )
|
im__fftproc( IMAGE *dummy, IMAGE *in, IMAGE *out, im__fftproc_fn fn )
|
||||||
{
|
{
|
||||||
IMAGE **bands;
|
IMAGE **bands;
|
||||||
IMAGE **fft;
|
IMAGE **fft;
|
||||||
IMAGE *t;
|
|
||||||
int b;
|
int b;
|
||||||
|
|
||||||
if( in->Bands == 1 )
|
if( in->Bands == 1 )
|
||||||
return( fn( dummy, in, out ) );
|
return( fn( dummy, in, out ) );
|
||||||
|
|
||||||
if( !(bands = IM_ARRAY( dummy, in->Bands, IMAGE * )) ||
|
if( !(bands = IM_ARRAY( dummy, in->Bands, IMAGE * )) ||
|
||||||
!(fft = IM_ARRAY( dummy, in->Bands, IMAGE * )) ||
|
im_open_local_array( dummy, bands, in->Bands, "bands", "p" ) )
|
||||||
im_open_local_array( dummy, bands, in->Bands, "bands", "p" ) ||
|
return( -1 );
|
||||||
im_open_local_array( dummy, fft, in->Bands, "fft", "p" ) )
|
|
||||||
|
if( !(fft = IM_ARRAY( out, in->Bands, IMAGE * )) ||
|
||||||
|
im_open_local_array( out, fft, in->Bands, "fft", "p" ) )
|
||||||
return( -1 );
|
return( -1 );
|
||||||
|
|
||||||
for( b = 0; b < in->Bands; b++ )
|
for( b = 0; b < in->Bands; b++ )
|
||||||
@ -518,12 +341,7 @@ im__fftproc( IMAGE *dummy, IMAGE *in, IMAGE *out, im__fftproc_fn fn )
|
|||||||
fn( dummy, bands[b], fft[b] ) )
|
fn( dummy, bands[b], fft[b] ) )
|
||||||
return( -1 );
|
return( -1 );
|
||||||
|
|
||||||
/* We need a "t" for the combined image that won't get freed too
|
if( im_gbandjoin( fft, out, in->Bands ) )
|
||||||
* quickly.
|
|
||||||
*/
|
|
||||||
if( !(t = im_open_local( out, "im__fftproc", "t" )) ||
|
|
||||||
im_gbandjoin( fft, t, in->Bands ) ||
|
|
||||||
im_copy( t, out ) )
|
|
||||||
return( -1 );
|
return( -1 );
|
||||||
|
|
||||||
return( 0 );
|
return( 0 );
|
||||||
@ -536,10 +354,8 @@ im__fftproc( IMAGE *dummy, IMAGE *in, IMAGE *out, im__fftproc_fn fn )
|
|||||||
*
|
*
|
||||||
* Transform an image to Fourier space.
|
* Transform an image to Fourier space.
|
||||||
*
|
*
|
||||||
* VIPS uses the fftw3 or fftw2 Fourier transform libraries if possible. If
|
* VIPS uses the fftw Fourier Transform library. If this library was not
|
||||||
* they were not available when VIPS was built, it falls back to it's own
|
* available when VIPS was configured, these functions will fail.
|
||||||
* FFT functions which are slow and only work for square images whose sides
|
|
||||||
* are a power of two.
|
|
||||||
*
|
*
|
||||||
* See also: im_invfft(), im_disp_ps().
|
* See also: im_invfft(), im_disp_ps().
|
||||||
*
|
*
|
||||||
|
@ -61,65 +61,14 @@
|
|||||||
#include <math.h>
|
#include <math.h>
|
||||||
|
|
||||||
#ifdef HAVE_FFTW
|
#ifdef HAVE_FFTW
|
||||||
#include <fftw.h>
|
|
||||||
#endif /*HAVE_FFTW*/
|
|
||||||
|
|
||||||
#ifdef HAVE_FFTW3
|
|
||||||
#include <fftw3.h>
|
#include <fftw3.h>
|
||||||
#endif /*HAVE_FFTW3*/
|
#endif /*HAVE_FFTW*/
|
||||||
|
|
||||||
#include <vips/vips.h>
|
#include <vips/vips.h>
|
||||||
#include <vips/internal.h>
|
#include <vips/internal.h>
|
||||||
|
|
||||||
#ifdef HAVE_FFTW
|
#ifdef HAVE_FFTW
|
||||||
|
|
||||||
/* Call fftw for a 1 band image.
|
|
||||||
*/
|
|
||||||
static int
|
|
||||||
invfft1( IMAGE *dummy, IMAGE *in, IMAGE *out )
|
|
||||||
{
|
|
||||||
fftwnd_plan plan;
|
|
||||||
|
|
||||||
IMAGE *cmplx = im_open_local( out, "invfft1:1", "t" );
|
|
||||||
|
|
||||||
/* Make dp complex image.
|
|
||||||
*/
|
|
||||||
if( !cmplx || im_pincheck( in ) || im_poutcheck( out ) )
|
|
||||||
return( -1 );
|
|
||||||
if( in->Coding != IM_CODING_NONE || in->Bands != 1 ) {
|
|
||||||
im_error( "im_invfft", "%s", _( "one band uncoded only" ) );
|
|
||||||
return( -1 );
|
|
||||||
}
|
|
||||||
if( im_clip2fmt( in, cmplx, IM_BANDFMT_DPCOMPLEX ) )
|
|
||||||
return( -1 );
|
|
||||||
|
|
||||||
/* Make the plan for the transform. Yes, they really do use nx for
|
|
||||||
* height and ny for width.
|
|
||||||
*/
|
|
||||||
if( !(plan = fftw2d_create_plan( in->Ysize, in->Xsize,
|
|
||||||
FFTW_BACKWARD,
|
|
||||||
FFTW_MEASURE | FFTW_USE_WISDOM | FFTW_IN_PLACE )) ) {
|
|
||||||
im_error( "im_invfft",
|
|
||||||
"%s", _( "unable to create transform plan" ) );
|
|
||||||
return( -1 );
|
|
||||||
}
|
|
||||||
|
|
||||||
fftwnd_one( plan, (fftw_complex *) cmplx->data, NULL );
|
|
||||||
|
|
||||||
fftwnd_destroy_plan( plan );
|
|
||||||
|
|
||||||
cmplx->Type = IM_TYPE_B_W;
|
|
||||||
|
|
||||||
/* Copy to out.
|
|
||||||
*/
|
|
||||||
if( im_copy( cmplx, out ) )
|
|
||||||
return( -1 );
|
|
||||||
|
|
||||||
return( 0 );
|
|
||||||
}
|
|
||||||
|
|
||||||
#elif defined HAVE_FFTW3
|
|
||||||
|
|
||||||
/* Complex to complex inverse transform.
|
/* Complex to complex inverse transform.
|
||||||
*/
|
*/
|
||||||
static int
|
static int
|
||||||
|
@ -49,98 +49,14 @@
|
|||||||
#include <math.h>
|
#include <math.h>
|
||||||
|
|
||||||
#ifdef HAVE_FFTW
|
#ifdef HAVE_FFTW
|
||||||
#include <rfftw.h>
|
|
||||||
#endif /*HAVE_FFTW*/
|
|
||||||
|
|
||||||
#ifdef HAVE_FFTW3
|
|
||||||
#include <fftw3.h>
|
#include <fftw3.h>
|
||||||
#endif /*HAVE_FFTW3*/
|
#endif /*HAVE_FFTW*/
|
||||||
|
|
||||||
#include <vips/vips.h>
|
#include <vips/vips.h>
|
||||||
#include <vips/internal.h>
|
#include <vips/internal.h>
|
||||||
|
|
||||||
#ifdef HAVE_FFTW
|
#ifdef HAVE_FFTW
|
||||||
|
|
||||||
/* Use fftw2.
|
|
||||||
*/
|
|
||||||
static int
|
|
||||||
invfft1( IMAGE *dummy, IMAGE *in, IMAGE *out )
|
|
||||||
{
|
|
||||||
IMAGE *cmplx = im_open_local( dummy, "invfft1-1", "t" );
|
|
||||||
IMAGE *real = im_open_local( out, "invfft1-2", "t" );
|
|
||||||
const int half_width = in->Xsize / 2 + 1;
|
|
||||||
|
|
||||||
/* Transform to halfcomplex here.
|
|
||||||
*/
|
|
||||||
double *half_complex = IM_ARRAY( dummy,
|
|
||||||
in->Ysize * half_width * 2, double );
|
|
||||||
|
|
||||||
rfftwnd_plan plan;
|
|
||||||
int x, y;
|
|
||||||
double *q, *p;
|
|
||||||
|
|
||||||
if( !cmplx || !real || !half_complex || im_pincheck( in ) ||
|
|
||||||
im_poutcheck( out ) )
|
|
||||||
return( -1 );
|
|
||||||
if( in->Coding != IM_CODING_NONE || in->Bands != 1 ) {
|
|
||||||
im_error( "im_invfft", _( "one band uncoded only" ) );
|
|
||||||
return( -1 );
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Make dp complex image for input.
|
|
||||||
*/
|
|
||||||
if( im_clip2fmt( in, cmplx, IM_BANDFMT_DPCOMPLEX ) )
|
|
||||||
return( -1 );
|
|
||||||
|
|
||||||
/* Build half-complex image.
|
|
||||||
*/
|
|
||||||
if( im_incheck( cmplx ) )
|
|
||||||
return( -1 );
|
|
||||||
q = half_complex;
|
|
||||||
for( y = 0; y < cmplx->Ysize; y++ ) {
|
|
||||||
p = ((double *) cmplx->data) + (guint64) y * in->Xsize * 2;
|
|
||||||
|
|
||||||
for( x = 0; x < half_width; x++ ) {
|
|
||||||
q[0] = p[0];
|
|
||||||
q[1] = p[1];
|
|
||||||
p += 2;
|
|
||||||
q += 2;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Make mem buffer real image for output.
|
|
||||||
*/
|
|
||||||
if( im_cp_desc( real, in ) )
|
|
||||||
return( -1 );
|
|
||||||
real->BandFmt = IM_BANDFMT_DOUBLE;
|
|
||||||
real->Type = IM_TYPE_B_W;
|
|
||||||
if( im_setupout( real ) )
|
|
||||||
return( -1 );
|
|
||||||
|
|
||||||
/* Make the plan for the transform. Yes, they really do use nx for
|
|
||||||
* height and ny for width.
|
|
||||||
*/
|
|
||||||
if( !(plan = rfftw2d_create_plan( in->Ysize, in->Xsize,
|
|
||||||
FFTW_BACKWARD, FFTW_MEASURE | FFTW_USE_WISDOM )) ) {
|
|
||||||
im_error( "im_invfft", _( "unable to create transform plan" ) );
|
|
||||||
return( -1 );
|
|
||||||
}
|
|
||||||
|
|
||||||
rfftwnd_one_complex_to_real( plan,
|
|
||||||
(fftw_complex *) half_complex, (fftw_real *) real->data );
|
|
||||||
|
|
||||||
rfftwnd_destroy_plan( plan );
|
|
||||||
|
|
||||||
/* Copy to out.
|
|
||||||
*/
|
|
||||||
if( im_copy( real, out ) )
|
|
||||||
return( -1 );
|
|
||||||
|
|
||||||
return( 0 );
|
|
||||||
}
|
|
||||||
|
|
||||||
#elif defined HAVE_FFTW3
|
|
||||||
|
|
||||||
/* Complex to real inverse transform.
|
/* Complex to real inverse transform.
|
||||||
*/
|
*/
|
||||||
static int
|
static int
|
||||||
|
Loading…
Reference in New Issue
Block a user