Page MenuHomec4science

d_seeing_omp.c
No OneTemporary

File Metadata

Created
Fri, Jan 17, 00:48

d_seeing_omp.c

This document is not UTF8. It was detected as Shift JIS and converted to UTF8 for display.
//d_seeing_omp.c
//
// name of main function: d_seeing_omp
// author: Sergey Rodionov (astroseger@gmail.com)
// date: 01/2012
// place: Marseille
//
//function for fast add seeing to images by means of fft
//principal function is the last function
//ATTENTION!!! WE USE GLOBAL VARIABLES FOR OPTIMISATION REASONS
//so don't remove check_not_in_parallel();
//because historical reason we have nx, ny swapped in respect to lenstool
//here -- im[0..nx][0..ny] ... in lenstool im[0..ny][0..nx]
#include <gsl/gsl_fft_complex.h>
#include <stdio.h>
#include <stdlib.h>
#include "structure.h"
#include "lt.h"
struct cpa2d; //predifiniton of cpa2d (see below)
//ATTENTION!!!! GLOBAL VARIABLES
//fourier transformation of psf
//psf_f->nx, psf_f->ny --- sizes of our image!
static struct cpa2d* psf_f = NULL;
//preallocated "padded" image
//(we only us it directly from d_seeing_omp)
static struct cpa2d* pim_global = NULL;
//structure which keep parameters for which psf_f as constructed
//(just to check that it haven't been changed)
static struct g_observ O_psf_f;
//nx, ny and scale for first run (in addition to O_psf_f)
static int nx_init, ny_init;
static double scale_init;
//wavetables and workspaces for fourier trasform
// *_x - for psf->nx
// *_y - for psf->ny
//for each row or column --- separeated workspace
static gsl_fft_complex_wavetable * wt_x;
static gsl_fft_complex_wavetable * wt_y;
static gsl_fft_complex_workspace **ws_x; //size psf_f->ny !!! (reverse!)
static gsl_fft_complex_workspace **ws_y; //size psf_f->nx !!! (reserse!)
//gsl "complex packed array" in 2D. For 2D fourier trasform
struct cpa2d
{
double* v;
int nx;
int ny;
};
//
//several basic function for the access to cpa2d, and allocate/free of it
static struct cpa2d* cpa2d_alloc(int nx, int ny)
{
struct cpa2d* c = (struct cpa2d*) malloc(sizeof(struct cpa2d*));
c->v = (double*) malloc(sizeof(double) * nx * ny * 2);
c->nx = nx;
c->ny = ny;
return c;
}
//
static void cpa2d_free(struct cpa2d* c)
{
free(c->v);
free(c);
}
//
inline void cpa2d_set(struct cpa2d* c, int i, int j, double re, double im)
{
c->v[(i * c->ny + j) * 2] = re;
c->v[(i * c->ny + j) * 2 + 1] = im;
}
//
inline void cpa2d_set_re(struct cpa2d* c, int i, int j, double re)
{
c->v[(i * c->ny + j) * 2] = re;
}
//
inline double cpa2d_get_re(struct cpa2d* c, int i, int j)
{
return c->v[(i * c->ny + j) * 2];
}
//
inline double cpa2d_get_im(struct cpa2d* c, int i, int j)
{
return c->v[(i * c->ny + j) * 2 + 1];
}
//
//from im (nx,ny) to pim (pim->nx,pim->ny) with zero padding
static void zero_padding(double **im, int nx, int ny,
struct cpa2d* pim)
{
if (pim->nx <= nx || pim->ny <= ny)
{
fprintf(stderr, "error | zero_paddinig | pim->nx <= nx || pim->ny <= ny\n");
exit(EXIT_FAILURE);
}
int px = (pim->nx - nx) / 2;
int py = (pim->ny - ny) / 2;
int i;
#pragma omp parallel for schedule(static)
for (i = 0 ; i < pim->nx ; i++)
{
int j;
for (j = 0 ; j < pim->ny ; j++)
{
if ((i >= px) && (i < px + nx) &&
(j >= py) && (j < py + ny))
{
cpa2d_set(pim, i, j, im[i - px][j - py], 0);
}
else
{
cpa2d_set(pim, i, j, 0, 0);
}
}
}
}
//from pim to im (unpadding and "unsplitting")
//We take into account "splitting" in pim
//if cntrx, cntry - is position of maximum in psf
//and it is center of "splitting"
static void split_unpadding(double **im, int nx, int ny,
struct cpa2d* pim)
{
int px = (pim->nx - nx) / 2;
int py = (pim->ny - ny) / 2;
//calculate position of center in psf
//for odd center in n/2
//for even center in (n - 0.5)/2
int cntrx = (int)floor((pim->nx - 0.5) / 2.0);
int cntry = (int) floor((pim->ny - 0.5) / 2.0);
int i;
#pragma omp parallel for schedule(static)
for (i = px ; i < px + nx ; i++)
{
int j;
for (j = py ; j < py + ny ; j++)
{
int ip, jp;
ip = i;
jp = j;
//splitting
if (i < pim->nx - cntrx)
ip = i + cntrx;
else
ip = i - (pim->nx - cntrx);
if (j < pim->ny - cntry)
jp = j + cntry;
else
jp = j - (pim->ny - cntry);
//unpadding
im[i - px][j - py] = cpa2d_get_re(pim, ip, jp);
}
}
}
//two simple function for 2D fast fourier trasform (direct and invert)
//ATENTIANON this two function use global variables
static void fft_2D_omp(struct cpa2d* data)
{
int i;
#pragma omp parallel for schedule(static)
for (i = 0 ; i < data->nx ; i++)
{
gsl_fft_complex_forward(data->v + data->ny * i * 2, 1, data->ny,
wt_y, ws_y[i]);
}
#pragma omp parallel for schedule(static)
for (i = 0 ; i < data->ny ; i++)
{
gsl_fft_complex_forward(data->v + i * 2, data->ny,
data->nx, wt_x, ws_x[i]);
}
}
//
static void fft_2D_inv_omp(struct cpa2d* data)
{
int i;
#pragma omp parallel for schedule(static)
for (i = 0 ; i < data->nx ; i++)
{
gsl_fft_complex_inverse(data->v + data->ny * i * 2, 1,
data->ny, wt_y, ws_y[i]);
}
#pragma omp parallel for schedule(static)
for (i = 0 ; i < data->ny ; i++)
{
gsl_fft_complex_inverse(data->v + i * 2, data->ny,
data->nx, wt_x, ws_x[i]);
}
}
// ム
//we choose smallest number greater than n for which gsl fft is fast
//(biggest factor should be equal to 7. see gsl documentation)
static int choose_fast_fft_n(int n)
{
const int primes[4] = {2, 3, 5, 7};
const int primes_n = 4;
int det = 0;
do
{
int tmp = n;
int i;
for (i = 0 ; i < primes_n ; i++)
while (tmp % primes[i] == 0)
tmp /= primes[i];
if (tmp == 1)
det = 1;
else
n++;
}
while (!det);
return n;
}
//
static void create_psf_psffile(double***spsf, int* nx, int* ny)
{
char* header;
const extern struct g_observ O;
//again nx and ny should be swapped here
*spsf = rdf_fits((char*)O.psffile, ny, nx, &header);
free(header);
//check maximum (it should be at nx/2 ny/2)
int max_i = *nx / 2;
int max_j = *ny / 2;
int i,j;
for (i = 0 ; i < *nx ; i++)
for (j = 0 ; j < *ny; j++)
{
if ((*spsf)[i][j] > (*spsf)[max_i][max_j])
{
fprintf(stderr, "Error | d_seeing_omp/create_psf_psffile | maximum is not located in center of psf\n");
exit(EXIT_FAILURE);
}
}
//normalization
long double sum = 0;
for (i = 0 ; i < *nx ; i++)
for (j = 0 ; j < *ny ; j++)
sum += (*spsf)[i][j];
for (i = 0 ; i < *nx ; i++)
for (j = 0 ; j < *ny ; j++)
{
(*spsf)[i][j] /= sum;
}
}
//
static void create_psf_create_filtre(double scale, int big_n, double***spsf, int* nx, int*ny)
{
int i,j;
const double PSF_ZERO = 1e-20;
const extern struct g_observ O;
//create_filtre work correctly only for even n
if (big_n % 2 != 0)
big_n++;
double** psf = (double **) alloc_square_double(big_n, big_n);
if (O.filtre)
{
fprintf(stderr, "Error | d_seeing_omp.c/create_psf | O.filtre != 0 we don't know what it means");
exit(EXIT_FAILURE);
}
if (O.setseeing == 1)
{
crea_filtre(O.seeing, scale, psf, big_n);
}
else if (O.setseeing == 2)
{
crea_filtre_e(O.seeing_a, O.seeing_b, O.seeing_angle, scale, psf, big_n);
}
else
{
fprintf(stderr, "Error | d_seeing_omp.c/create_psf | unknown O.setseeing = %d", O.setseeing);
exit(EXIT_FAILURE);
}
//just in case we check maximum value (it should be in big_n/2)
int max_i = big_n / 2;
for (i = 0 ; i < big_n ; i++)
for (j = 0 ; j < big_n; j++)
if (psf[i][j] > psf[max_i][max_i])
{
fprintf(stderr, "Unexpected behavior of crea_filtre\n");
exit(EXIT_FAILURE);
}
//now we can try to shrink psf
int si = 1;
int sj = 1;
int det = 1;
do
{
for (j = 0 ; j < big_n ; j++)
{
if (psf[si][j] > PSF_ZERO || psf[2 * max_i - si][j] > PSF_ZERO)
det = 0;
}
if (det)
si++;
if (si == max_i)
{
fprintf(stderr, "Unexpected behavior 3 of crea_filtre\n");
exit(EXIT_FAILURE);
}
}
while (det);
det = 1;
do
{
for (i = 0 ; i < big_n ; i++)
{
if (psf[i][sj] > PSF_ZERO || psf[i][2 * max_i - sj] > PSF_ZERO)
det = 0;
}
if (det)
sj++;
if (sj == max_i)
{
fprintf(stderr, "Unexpected behavior 3 of crea_filtre\n");
exit(EXIT_FAILURE);
}
}
while (det);
*nx = (max_i - si) * 2 + 1;
*ny = (max_i - sj) * 2 + 1;
(*spsf) = (double **) alloc_square_double(*nx, *ny);
long double sum = 0;
for (i = 0 ; i < *nx ; i++)
for (j = 0 ; j < *ny ; j++)
{
(*spsf)[i][j] = psf[si + i][sj + j];
sum += (*spsf)[i][j];
}
for (i = 0 ; i < *nx ; i++)
for (j = 0 ; j < *ny ; j++)
{
(*spsf)[i][j] /= sum;
}
free_square_double(psf, big_n);
}
//
static void create_psf(double scale, int big_n, double***spsf, int* nx, int*ny)
{
const extern struct g_observ O;
//we also save parameters for which psf was constructed
O_psf_f = O; //we cannot use O_psf_f.psfile anymore!x
if (O.setseeing == 1 || O.setseeing == 2)
{
create_psf_create_filtre(scale, big_n, spsf, nx, ny);
}
else if (O.setseeing == 3)
{
create_psf_psffile(spsf, nx, ny);
}
else
{
fprintf(stderr, "Error | d_seeing_omp.c/create_psf | unknown O.setseeing = %d", O.setseeing);
exit(EXIT_FAILURE);
}
}
//
//because historical reason we have nx, ny swapped in respect to lenstool
//here -- im[0..nx][0..ny] ... in lenstool im[0..ny][0..nx]
//ATTENTIAON!!! because of these nx ny was swapped here !!!
void d_seeing_omp(double **im, int ny, int nx, double scale)
{
//we must not be in parallel now
check_not_in_parallel("d_seeing_omp");
int i;
if (psf_f == NULL) //first run
{
double** psf;
int nx_psf,ny_psf;
//create psf and save parameters for which it was constructed
create_psf(scale, nx + 1, &psf, &nx_psf, &ny_psf);
//save value of nx and ny of first run
nx_init = nx;
ny_init = ny;
//save scale parameter of first run
scale_init = scale;
//we should add "zero" padding of size at least nx_psf/2 (ny_psf/2)
//this value is exactly equal to size of wings of psf...
//and after we search appropriative size of array for which fft
//could be calculated fast
int nx1 = choose_fast_fft_n(nx + nx_psf / 2);
int ny1 = choose_fast_fft_n(ny + ny_psf / 2);
// printf("nx=%d ny=%d nx_psf=%d ny_psf=%d nx1=%d ny1=%d\n",
// nx, ny, nx_psf, ny_psf, nx1, ny1);
//now we can allocated wavetables and workspaces for fft
wt_x = gsl_fft_complex_wavetable_alloc (nx1);
wt_y = gsl_fft_complex_wavetable_alloc (ny1);
ws_x = (gsl_fft_complex_workspace**)
malloc(sizeof(gsl_fft_complex_workspace*) * ny1);
ws_y = (gsl_fft_complex_workspace**)
malloc(sizeof(gsl_fft_complex_workspace*) * nx1);
for (i = 0 ; i < ny1 ; i++)
ws_x[i] = gsl_fft_complex_workspace_alloc (nx1);
for (i = 0 ; i < nx1 ; i++)
ws_y[i] = gsl_fft_complex_workspace_alloc (ny1);
//calculate fft of psf
psf_f = cpa2d_alloc(nx1, ny1);
zero_padding(psf, nx_psf, ny_psf, psf_f);
fft_2D_omp(psf_f);
//and finally allocated padded image with which we will work
pim_global = cpa2d_alloc(psf_f->nx, psf_f->ny);
//real psf we will not need anymore
free_square_double(psf, nx_psf);
}
else
{
//we just check that noting have changed after initialisation
const extern struct g_observ O;
if (nx != nx_init || ny != ny_init || scale != scale_init)
{
fprintf(stderr, "Error | d_seeing_omp.c/d_seeing_omp | nx, ny or scale have been changed from first run");
exit(EXIT_FAILURE);
}
if (O.setseeing != O_psf_f.setseeing ||
O.seeing != O_psf_f.seeing ||
O.seeing_a != O_psf_f.seeing_a ||
O.seeing_b != O_psf_f.seeing_b ||
O.seeing_angle != O_psf_f.seeing_angle )
{
fprintf(stderr, "Error | d_seeing_omp.c/d_seeing_omp | O structure have been changed from first run");
exit(EXIT_FAILURE);
}
}
//Now we can start main part of algorim
//psf_f->nx and psf_f->ny keep dimension of padded image
struct cpa2d* pim = pim_global; //just for simplicity
zero_padding(im, nx, ny, pim);
fft_2D_omp(pim);
//simple multiplication of pim and psf_f
//(see basic theory of convolution)
#pragma omp parallel for schedule(static)
for (i = 0 ; i < pim->nx * pim->ny * 2 ; i += 2)
{
double rr = pim->v[i] * psf_f->v[i] - pim->v[i + 1] * psf_f->v[i + 1];
double ii = pim->v[i] * psf_f->v[i + 1] + pim->v[i + 1] * psf_f->v[i];
pim->v[i] = rr;
pim->v[i + 1] = ii;
}
fft_2D_inv_omp(pim);
split_unpadding(im, nx, ny, pim);
}

Event Timeline