ISCE_INSAR/contrib/PyCuAmpcor/src/cuAmpcorController.cu

/**
 * @file cuAmpcorController.cu
 * @brief Implementations of cuAmpcorController
 */

// my declaration
#include "cuAmpcorController.h"

// dependencies
#include "GDALImage.h"
#include "cuArrays.h"
#include "cudaUtil.h"
#include "cuAmpcorChunk.h"
#include "cuAmpcorUtil.h"
#include <iostream>
#include <vector>

/**
 * Constructor
 *
 * Allocates a fresh cuAmpcorParameter object and stores it in param.
 */
cuAmpcorController::cuAmpcorController()
{
    cuAmpcorParameter *freshParameters = new cuAmpcorParameter();
    this->param = freshParameters;
}

/**
 * Destructor
 *
 * Frees the parameter object held in param.
 */
cuAmpcorController::~cuAmpcorController()
{
    delete this->param;
}


/**
 *  Run ampcor
 *
 *  Steps, in order:
 *   1. select the GPU device and register the GDAL drivers;
 *   2. open the reference and secondary images (band 1);
 *   3. allocate the "run" arrays (numberChunk * numberWindowInChunk per
 *      direction) and the final output arrays (numberWindowDown x
 *      numberWindowAcross) for offsets, SNR and covariance;
 *   4. create one CUDA stream and one cuAmpcorChunk processor per stream;
 *   5. for every chunk row, hand chunk (i, j + ist) to processor ist;
 *   6. synchronize the device, extract the final arrays from the run arrays,
 *      write them to file, and write the gross offsets;
 *   7. release all arrays, streams, chunk processors and images.
 *
 *  All inputs are read from the member param; param->deviceID is overwritten
 *  with the value returned by gpuDeviceInit.
 */
void cuAmpcorController::runAmpcor()
{
    // set the gpu id
    param->deviceID = gpuDeviceInit(param->deviceID);
    // initialize the gdal driver
    GDALAllRegister();
    // reference and secondary images; use band=1 as default
    // TODO: selecting band
    GDALImage *referenceImage = new GDALImage(param->referenceImageName, 1, param->mmapSizeInGB);
    GDALImage *secondaryImage = new GDALImage(param->secondaryImageName, 1, param->mmapSizeInGB);

    // nWindowsDownRun is defined as numberChunk * numberWindowInChunk
    // It may be bigger than the actual number of windows
    const int nWindowsDownRun = param->numberChunkDown * param->numberWindowDownInChunk;
    const int nWindowsAcrossRun = param->numberChunkAcross * param->numberWindowAcrossInChunk;

    // working ("run") arrays the chunk processors are given to write into
    cuArrays<float2> *offsetImageRun = new cuArrays<float2>(nWindowsDownRun, nWindowsAcrossRun);
    offsetImageRun->allocate();

    cuArrays<float> *snrImageRun = new cuArrays<float>(nWindowsDownRun, nWindowsAcrossRun);
    snrImageRun->allocate();

    cuArrays<float3> *covImageRun = new cuArrays<float3>(nWindowsDownRun, nWindowsAcrossRun);
    covImageRun->allocate();

    // Offset fields.
    cuArrays<float2> *offsetImage = new cuArrays<float2>(param->numberWindowDown, param->numberWindowAcross);
    offsetImage->allocate();

    // SNR.
    cuArrays<float> *snrImage = new cuArrays<float>(param->numberWindowDown, param->numberWindowAcross);
    snrImage->allocate();

    // Variance.
    cuArrays<float3> *covImage = new cuArrays<float3>(param->numberWindowDown, param->numberWindowAcross);
    covImage->allocate();

    // At least one stream is required: streams[0] drives the output stage and
    // the across-chunk loop advances by the stream count (a zero step would
    // never terminate).
    int nStreams = param->nStreams;
    if (nStreams < 1) {
        std::cerr << "Warning: invalid number of streams (" << nStreams
            << "), using 1 stream instead" << std::endl;
        nStreams = 1;
    }

    // set up the cuda streams
    // std::vector instead of variable-length arrays, which are not standard C++
    std::vector<cudaStream_t> streams(nStreams);
    std::vector<cuAmpcorChunk *> chunk(nStreams, nullptr);
    // iterate over cuda streams
    for(int ist=0; ist<nStreams; ist++)
    {
        // create each stream
        checkCudaErrors(cudaStreamCreate(&streams[ist]));
        // create the chunk processor for each stream
        chunk[ist]= new cuAmpcorChunk(param, referenceImage, secondaryImage,
            offsetImageRun, snrImageRun, covImageRun,
            streams[ist]);

    }

    const int nChunksDown = param->numberChunkDown;
    const int nChunksAcross = param->numberChunkAcross;

    // report info
    std::cout << "Total number of windows (azimuth x range):  "
        << param->numberWindowDown << " x " << param->numberWindowAcross
        << std::endl;
    std::cout << "to be processed in the number of chunks: "
        << nChunksDown << " x " << nChunksAcross  << std::endl;

    // iterate over chunks down
    for(int i = 0; i<nChunksDown; i++)
    {
        std::cout << "Processing chunk (" << i <<", x" << ") out of " << nChunksDown << std::endl;
        // iterate over chunks across, nStreams chunks at a time
        for(int j=0; j<nChunksAcross; j+=nStreams)
        {
            // iterate over cuda streams to process chunks
            for(int ist = 0; ist < nStreams; ist++)
            {
                const int chunkIdxAcross = j+ist;
                // the last group may have fewer chunks than streams
                if(chunkIdxAcross < nChunksAcross) {
                    chunk[ist]->run(i, chunkIdxAcross);
                }
            }
        }
    }

    // wait until all streams are done; checking the result also reports
    // errors raised by previously issued asynchronous work
    checkCudaErrors(cudaDeviceSynchronize());

    // extraction of the run images to output images
    cuArraysCopyExtract(offsetImageRun, offsetImage, make_int2(0,0), streams[0]);
    cuArraysCopyExtract(snrImageRun, snrImage, make_int2(0,0), streams[0]);
    cuArraysCopyExtract(covImageRun, covImage, make_int2(0,0), streams[0]);
    // save outputs to files
    offsetImage->outputToFile(param->offsetImageName, streams[0]);
    snrImage->outputToFile(param->snrImageName, streams[0]);
    covImage->outputToFile(param->covImageName, streams[0]);
    // also save the gross offsets
    outputGrossOffsets();

    // Delete arrays.
    delete offsetImage;
    delete snrImage;
    delete covImage;

    delete offsetImageRun;
    delete snrImageRun;
    delete covImageRun;

    // release each stream together with its chunk processor
    for (int ist=0; ist<nStreams; ist++)
    {
        checkCudaErrors(cudaStreamDestroy(streams[ist]));
        delete chunk[ist];
    }

    delete referenceImage;
    delete secondaryImage;

}

/**
 * Output gross offset fields
 *
 * Builds a host-side float2 array of numberWindowDown x numberWindowAcross,
 * fills entry k with (grossOffsetDown[k], grossOffsetAcross[k]) for every
 * k below numberWindows, and writes it to param->grossOffsetImageName.
 */
void cuAmpcorController::outputGrossOffsets()
{
    cuArrays<float2> *grossImage =
        new cuArrays<float2>(param->numberWindowDown, param->numberWindowAcross);
    grossImage->allocateHost();

    // pack the (down, across) pair of each window into one float2 entry
    int windowIdx = 0;
    while (windowIdx < param->numberWindows)
    {
        const float2 offsetPair = make_float2(param->grossOffsetDown[windowIdx],
                                              param->grossOffsetAcross[windowIdx]);
        grossImage->hostData[windowIdx] = offsetPair;
        ++windowIdx;
    }

    grossImage->outputHostToFile(param->grossOffsetImageName);
    delete grossImage;
}

// end of file
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`/**`
			`* @file cuAmpcorController.cu`
			`* @brief Implementations of cuAmpcorController`
			`*/`
Adding all files 2019-01-16 19:40:08 +00:00
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// my declaration`
Adding all files 2019-01-16 19:40:08 +00:00			`#include "cuAmpcorController.h"`
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00
			`// dependencies`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`#include "GDALImage.h"`
Adding all files 2019-01-16 19:40:08 +00:00			`#include "cuArrays.h"`
			`#include "cudaUtil.h"`
			`#include "cuAmpcorChunk.h"`
			`#include "cuAmpcorUtil.h"`
			`#include <iostream>`

PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// constructor`
			`cuAmpcorController::cuAmpcorController()`
			`{`
			`// create a new set of parameters`
			`param = new cuAmpcorParameter();`
			`}`
Adding all files 2019-01-16 19:40:08 +00:00
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// destructor`
			`cuAmpcorController::~cuAmpcorController()`
			`{`
			`delete param;`
			`}`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00
			`/**`
			`* Run ampcor`
			`*`
			`*`
			`*/`
			`void cuAmpcorController::runAmpcor()`
			`{`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`// set the gpu id`
Adding all files 2019-01-16 19:40:08 +00:00			`param->deviceID = gpuDeviceInit(param->deviceID);`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`// initialize the gdal driver`
			`GDALAllRegister();`
diversity: replaced oppressive language with neutral definitions of the images that comprise an interferogram through the entire repository 2020-07-02 19:40:49 +00:00			`// reference and secondary images; use band=1 as default`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`// TODO: selecting band`
diversity: replaced oppressive language with neutral definitions of the images that comprise an interferogram through the entire repository 2020-07-02 19:40:49 +00:00			`GDALImage *referenceImage = new GDALImage(param->referenceImageName, 1, param->mmapSizeInGB);`
			`GDALImage *secondaryImage = new GDALImage(param->secondaryImageName, 1, param->mmapSizeInGB);`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
Adding all files 2019-01-16 19:40:08 +00:00			`cuArrays<float2> offsetImage, offsetImageRun;`
			`cuArrays<float> snrImage, snrImageRun;`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`cuArrays<float3> covImage, covImageRun;`

PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// nWindowsDownRun is defined as numberChunk * numberWindowInChunk`
			`// It may be bigger than the actual number of windows`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`int nWindowsDownRun = param->numberChunkDown * param->numberWindowDownInChunk;`
			`int nWindowsAcrossRun = param->numberChunkAcross * param->numberWindowAcrossInChunk;`

Adding all files 2019-01-16 19:40:08 +00:00			`offsetImageRun = new cuArrays<float2>(nWindowsDownRun, nWindowsAcrossRun);`
			`offsetImageRun->allocate();`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
			`snrImageRun = new cuArrays<float>(nWindowsDownRun, nWindowsAcrossRun);`
Adding all files 2019-01-16 19:40:08 +00:00			`snrImageRun->allocate();`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
			`covImageRun = new cuArrays<float3>(nWindowsDownRun, nWindowsAcrossRun);`
			`covImageRun->allocate();`

PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// Offset fields.`
Adding all files 2019-01-16 19:40:08 +00:00			`offsetImage = new cuArrays<float2>(param->numberWindowDown, param->numberWindowAcross);`
			`offsetImage->allocate();`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
			`// SNR.`
			`snrImage = new cuArrays<float>(param->numberWindowDown, param->numberWindowAcross);`
Adding all files 2019-01-16 19:40:08 +00:00			`snrImage->allocate();`

PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`// Variance.`
			`covImage = new cuArrays<float3>(param->numberWindowDown, param->numberWindowAcross);`
			`covImage->allocate();`
Adding all files 2019-01-16 19:40:08 +00:00
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// set up the cuda streams`
Adding all files 2019-01-16 19:40:08 +00:00			`cudaStream_t streams[param->nStreams];`
			`cuAmpcorChunk *chunk[param->nStreams];`
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// iterate over cuda streams`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`for(int ist=0; ist<param->nStreams; ist++)`
Adding all files 2019-01-16 19:40:08 +00:00			`{`
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// create each stream`
			`checkCudaErrors(cudaStreamCreate(&streams[ist]));`
			`// create the chunk processor for each stream`
			`chunk[ist]= new cuAmpcorChunk(param, referenceImage, secondaryImage,`
			`offsetImageRun, snrImageRun, covImageRun,`
PyCuAmpcor updates: * added a README.md for installation/user guide/procedures * modified the cuDenseOffsets.py * expose more options from the CUDA/C++ program * add an option for varying gross offset input * clarify the parameter definitions * removed old SlcImage implementation and cublas dependence * modified cuSincOversampler * to be consistent with cpu version * fix an issue when the extraction of the search window is not around the center * added a debug mode to output intermediate results * enable cuda error checking for both Debug/Release build types * corrected the code to extract raw images when the correlation surface peak is close to edges * Move utf-8 decoding step inside cython extension The cython setters take python strings, but the getters return python bytes, so this makes the types match up. I went with regular python strings for the interface since they are more common at the python level, so the encoding/decoding is now an implementation detail of the cython extension. Contributed by lijun99, rtburns-jpl, vbrancat, mzzhong 2020-11-12 23:02:44 +00:00			`streams[ist]);`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
Adding all files 2019-01-16 19:40:08 +00:00			`}`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
Adding all files 2019-01-16 19:40:08 +00:00			`int nChunksDown = param->numberChunkDown;`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`int nChunksAcross = param->numberChunkAcross;`

PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// report info`
			`std::cout << "Total number of windows (azimuth x range): "`
			`<< param->numberWindowDown << " x " << param->numberWindowAcross`
			`<< std::endl;`
			`std::cout << "to be processed in the number of chunks: "`
			`<< nChunksDown << " x " << nChunksAcross << std::endl;`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// iterative over chunks down`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`for(int i = 0; i<nChunksDown; i++)`
Adding all files 2019-01-16 19:40:08 +00:00			`{`
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`std::cout << "Processing chunk (" << i <<", x" << ") out of " << nChunksDown << std::endl;`
			`// iterate over chunks across`
Adding all files 2019-01-16 19:40:08 +00:00			`for(int j=0; j<nChunksAcross; j+=param->nStreams)`
			`{`
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// iterate over cuda streams to process chunks`
			`for(int ist = 0; ist < param->nStreams; ist++)`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`{`
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`int chunkIdxAcross = j+ist;`
			`if(chunkIdxAcross < nChunksAcross) {`
			`chunk[ist]->run(i, chunkIdxAcross);`
Adding all files 2019-01-16 19:40:08 +00:00			`}`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`}`
Adding all files 2019-01-16 19:40:08 +00:00			`}`
			`}`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// wait all streams are done`
Adding all files 2019-01-16 19:40:08 +00:00			`cudaDeviceSynchronize();`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// extraction of the run images to output images`
Adding all files 2019-01-16 19:40:08 +00:00			`cuArraysCopyExtract(offsetImageRun, offsetImage, make_int2(0,0), streams[0]);`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`cuArraysCopyExtract(snrImageRun, snrImage, make_int2(0,0), streams[0]);`
			`cuArraysCopyExtract(covImageRun, covImage, make_int2(0,0), streams[0]);`
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// save outputs to files`
Adding all files 2019-01-16 19:40:08 +00:00			`offsetImage->outputToFile(param->offsetImageName, streams[0]);`
			`snrImage->outputToFile(param->snrImageName, streams[0]);`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`covImage->outputToFile(param->covImageName, streams[0]);`
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// also save the gross offsets`
Adding all files 2019-01-16 19:40:08 +00:00			`outputGrossOffsets();`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
			`// Delete arrays.`
Adding all files 2019-01-16 19:40:08 +00:00			`delete offsetImage;`
			`delete snrImage;`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`delete covImage;`

Adding all files 2019-01-16 19:40:08 +00:00			`delete offsetImageRun;`
			`delete snrImageRun;`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00			`delete covImageRun;`

Adding all files 2019-01-16 19:40:08 +00:00			`for (int ist=0; ist<param->nStreams; ist++)`
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`{`
			`checkCudaErrors(cudaStreamDestroy(streams[ist]));`
Adding all files 2019-01-16 19:40:08 +00:00			`delete chunk[ist];`
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`}`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
diversity: replaced oppressive language with neutral definitions of the images that comprise an interferogram through the entire repository 2020-07-02 19:40:49 +00:00			`delete referenceImage;`
			`delete secondaryImage;`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
			`}`
Adding all files 2019-01-16 19:40:08 +00:00
PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`/**`
			`* Output gross offset fields`
			`*/`
Adding all files 2019-01-16 19:40:08 +00:00			`void cuAmpcorController::outputGrossOffsets()`
			`{`
			`cuArrays<float2> *grossOffsets = new cuArrays<float2>(param->numberWindowDown, param->numberWindowAcross);`
			`grossOffsets->allocateHost();`
PyCuAmpcor: updated to the most recent version with gdal input 2019-11-20 00:59:49 +00:00
Adding all files 2019-01-16 19:40:08 +00:00			`for(int i=0; i< param->numberWindows; i++)`
			`grossOffsets->hostData[i] = make_float2(param->grossOffsetDown[i], param->grossOffsetAcross[i]);`
			`grossOffsets->outputHostToFile(param->grossOffsetImageName);`
			`delete grossOffsets;`
			`}`

PyCuAmpcor: code cleanup, add docstrings 2020-11-18 07:22:37 +00:00			`// end of file`