Dox/xf__warp__transform__accel_8cpp_source.html

 #include "../include/xf_warp_transform_config.h"

 #include <iostream>                     // For cout and cerr


 using namespace std;


 // Example transform matrix: {0.87,-0.5,0,0.5,0.87,0,0,0,1}


 /**
  * @brief Refresh the transform matrix from a stream of float coefficients.
  *
  * If sTxMatrix is non-empty on entry, TRANSFORM_MATRIX_DIM values are read from it,
  * in order, into transform_matrix[0 .. TRANSFORM_MATRIX_DIM-1]. If the stream is
  * empty on entry, transform_matrix is left untouched.
  *
  * @param transform_matrix  Destination array of TRANSFORM_MATRIX_DIM floats.
  * @param sTxMatrix         Source stream the coefficients are read from.
  */
 void setUpTxMatrixFromStream(float transform_matrix[TRANSFORM_MATRIX_DIM],
                              hls::stream<float> &sTxMatrix) {
     // NOTE(review): only the presence of the first element is checked; the
     // remaining reads presumably rely on the stream's blocking read - confirm.
     const bool matrix_available = !sTxMatrix.empty();

     if (matrix_available) {
         for (int coeff_idx = 0; coeff_idx < TRANSFORM_MATRIX_DIM; ++coeff_idx) {
             #pragma HLS PIPELINE
             const float coeff = sTxMatrix.read();
             transform_matrix[coeff_idx] = coeff;
         }
     }
 }


 /**
  * @brief Warp-transform accelerator entry point with array (pointer) interfaces.
  *
  * Copies the transform coefficients from @p transform into a local array, loads the
  * input image from @p img_in into an xf::cv::Mat, runs xf::cv::warpTransform on it
  * and writes the resulting xf::cv::Mat to @p img_out.
  *
  * @param img_in     Input image buffer, read through xf::cv::Array2xfMat.
  * @param transform  Transform coefficients; TRANSFORM_MATRIX_DIM floats are read.
  * @param img_out    Output image buffer, written through xf::cv::xfMat2Array.
  * @param rows       Row count used to construct the input and output Mats.
  * @param cols       Column count used to construct the input and output Mats.
  *
  * NOTE(review): the Mats are declared with XF_8UC1/NPIX while Array2xfMat and
  * warpTransform are instantiated with TYPE/NPC1; this presumably only compiles
  * when TYPE == XF_8UC1 and NPC1 == NPIX - confirm against the config header.
  */
 void warptTransformAccelArray(
     ap_uint<INPUT_PTR_WIDTH>* img_in, float* transform, ap_uint<OUTPUT_PTR_WIDTH>* img_out, int rows, int cols) {
     xf::cv::Mat<XF_8UC1, HEIGHT, WIDTH, NPIX> imgInput(rows, cols);
     // clang-format off
     #pragma HLS stream variable=imgInput.data depth=2
     // clang-format on

     xf::cv::Mat<XF_8UC1, HEIGHT, WIDTH, NPIX> imgOutput(rows, cols);
     // clang-format off
     #pragma HLS stream variable=imgOutput.data depth=2
     // clang-format on

     // clang-format off
     #pragma HLS DATAFLOW
     // clang-format on

     // Copy the transform coefficients from the caller's buffer into a local array.
     // Sized with TRANSFORM_MATRIX_DIM (instead of a literal 9) to stay in sync with
     // the other entry points in this file.
     float transform_matrix[TRANSFORM_MATRIX_DIM];

     for (unsigned int i = 0; i < TRANSFORM_MATRIX_DIM; ++i) {
         // clang-format off
         #pragma HLS PIPELINE
         // clang-format on
         transform_matrix[i] = transform[i];
     }

     // Pointer buffer -> Mat, run the kernel, Mat -> pointer buffer.
     xf::cv::Array2xfMat<INPUT_PTR_WIDTH, TYPE, HEIGHT, WIDTH, NPC1>(img_in, imgInput);

     xf::cv::warpTransform<NUM_STORE_ROWS, START_PROC, TRANSFORM_TYPE, INTERPOLATION, TYPE, HEIGHT, WIDTH, NPC1,
                           XF_USE_URAM>(imgInput, imgOutput, transform_matrix);

     xf::cv::xfMat2Array<OUTPUT_PTR_WIDTH, XF_8UC1, HEIGHT, WIDTH, NPIX>(imgOutput, img_out);
 }


 #ifndef FAKE_WarpTransform


 //extern "C" {

 /**
  * @brief Warp-transform accelerator entry point with stream interfaces.
  *
  * Fills an xf::cv::Mat from @p img_in_axi_stream, runs xf::cv::warpTransform with
  * the supplied matrix, and drains the result Mat into @p img_out_axi_stream.
  * Compiled only when FAKE_WarpTransform is not defined.
  *
  * @param img_in_axi_stream   Input pixel stream, consumed by accel_utils::hlsStrm2xfMat.
  * @param img_out_axi_stream  Output pixel stream, produced by accel_utils::xfMat2hlsStrm.
  * @param rows                Row count used to construct the input and output Mats.
  * @param cols                Column count used to construct the input and output Mats.
  * @param transform_matrix    Transform coefficients passed unchanged to warpTransform.
  */
 void warpTransformAccelStream(

     hls::stream<ap_uint<INPUT_PTR_WIDTH>>& img_in_axi_stream,

     hls::stream<ap_uint<OUTPUT_PTR_WIDTH>>& img_out_axi_stream,

     int rows, int cols,

     float transform_matrix[TRANSFORM_MATRIX_DIM]) {

     // clang-format on

     #pragma  HLS INLINE off


     // Intermediate image holding the pixels read from the input stream.
     xf::cv::Mat<TYPE, HEIGHT, WIDTH, NPIX> imgInput(rows, cols);

     // clang-format off

     #pragma HLS stream variable=imgInput.data depth=2

     // clang-format on


     // Intermediate image holding the output of warpTransform.
     xf::cv::Mat<TYPE, HEIGHT, WIDTH, NPIX> imgOutput(rows, cols);

     // clang-format off

     #pragma HLS stream variable=imgOutput.data depth=2

     // clang-format on


     // clang-format off

     #pragma HLS DATAFLOW

     // clang-format on

     //FIXME: not static matrix

     //float transform_matrix[9]={1.5,0,0,0,1.8,0,0,0,0};

     // float transform_matrix[9]={0.87,-0.5,0,0.5,0.87,0,0,0,1};


     accel_utils accel_utils_obj;


     // Presumably rounds the column count up to a multiple of NPIX (assuming
     // XF_BITSHIFT(NPIX) is log2(NPIX)) - TODO confirm.
     int dstMat_cols_align_npc = ((imgInput.cols + (NPIX - 1)) >> XF_BITSHIFT(NPIX)) << XF_BITSHIFT(NPIX);


     // Input stream -> imgInput.
     accel_utils_obj.hlsStrm2xfMat<INPUT_PTR_WIDTH, TYPE, HEIGHT, WIDTH, NPIX, (HEIGHT * WIDTH) / NPIX>(img_in_axi_stream, imgInput, dstMat_cols_align_npc);


     // Run xfOpenCV kernel:

     xf::cv::warpTransform<NUM_STORE_ROWS, START_PROC, TRANSFORM_TYPE, INTERPOLATION, TYPE, HEIGHT, WIDTH, NPC1,

                           XF_USE_URAM>(imgInput, imgOutput, transform_matrix);


     // Same alignment computation as above, applied to the output image's columns.
     int srcMat_cols_align_npc = ((imgOutput.cols + (NPIX - 1)) >> XF_BITSHIFT(NPIX)) << XF_BITSHIFT(NPIX);


     // imgOutput -> output stream.
     // NOTE(review): the last template argument here is HEIGHT*ceil(WIDTH/NPIX),
     // whereas hlsStrm2xfMat above uses (HEIGHT*WIDTH)/NPIX - confirm the
     // difference is intended.
     accel_utils_obj.xfMat2hlsStrm<OUTPUT_PTR_WIDTH, TYPE, HEIGHT, WIDTH, NPIX, HEIGHT*((WIDTH + NPIX - 1) / NPIX)>(imgOutput, img_out_axi_stream,

                                                                                         srcMat_cols_align_npc);

 }


 #else // FAKE_WarpTransform


 //extern "C" {

 /**
  * @brief Stand-in for the stream accelerator, built when FAKE_WarpTransform is defined.
  *
  * Runs a fixed budget of 5 * (min_rx_loops + min_tx_loops) iterations. On each
  * iteration it reads one word from the input stream if one is available and fewer
  * than @p min_rx_loops words have been read, copies the data field of the most
  * recently read word into the output word, and writes that word to the output
  * stream if it is not full and fewer than @p min_tx_loops words have been written.
  * Progress is logged to std::cout on every iteration.
  *
  * @param img_in_axi_stream   Input AXI stream.
  * @param img_out_axi_stream  Output AXI stream.
  * @param min_rx_loops        Upper bound on the number of words read.
  * @param min_tx_loops        Upper bound on the number of words written.
  * @param transform_matrix    Not used by this function.
  */
 void fakeWarpTransformAccelStream(
     hls::stream<ap_axiu<INPUT_PTR_WIDTH, 0, 0, 0> >& img_in_axi_stream,
     hls::stream<ap_axiu<OUTPUT_PTR_WIDTH, 0, 0, 0> >& img_out_axi_stream,
     unsigned int min_rx_loops,
     unsigned int min_tx_loops,
     float transform_matrix[TRANSFORM_MATRIX_DIM]) {

   #pragma  HLS INLINE off

   // NOTE(review): rx_word has no initializer, and its data is copied to the
   // output word even on iterations before the first successful read - confirm
   // this is acceptable for the fake path.
   ap_axiu<INPUT_PTR_WIDTH, 0, 0, 0> rx_word;
   ap_axiu<OUTPUT_PTR_WIDTH, 0, 0, 0> tx_word;

   unsigned int words_received = 0;
   unsigned int words_sent = 0;
   const unsigned int iteration_budget = 5 * (min_rx_loops + min_tx_loops);

   for (unsigned int iteration = 0; iteration < iteration_budget; ++iteration) {
     cout << "Consuming input...i=" << words_received << endl;
     const bool input_pending = !img_in_axi_stream.empty();
     if (input_pending && (words_received < min_rx_loops)) {
       rx_word = img_in_axi_stream.read();
       ++words_received;
     }

     // known silent dirty casting here when INPUT_PTR_WIDTH != OUTPUT_PTR_WIDTH
     tx_word.data = rx_word.data;

     cout << "Filling output...j=" << words_sent << endl;
     const bool output_has_room = !(img_out_axi_stream.full());
     if (output_has_room && (words_sent < min_tx_loops)) {
       img_out_axi_stream.write(tx_word);
       ++words_sent;
     }

     // Only reports that the transmit quota is reached; the loop keeps running
     // until the iteration budget is spent.
     if (words_sent == min_tx_loops) {
       cout << "Full" << endl;
     }
   }
 }


 #endif // FAKE_WarpTransform


 //extern "C" {

 /**
  * @brief Warp-transform accelerator entry point with memory-mapped image interfaces.
  *
  * Optionally refreshes the transform matrix from @p sTxMatrix, loads the input
  * image from @p img_inp into an xf::cv::Mat, and then either
  *  - (FAKE_WarpTransform defined) writes that Mat straight back to @p img_out, or
  *  - (otherwise) runs xf::cv::warpTransform and writes its output to @p img_out.
  *
  * @param img_inp    Input image buffer, read through xf::cv::Array2xfMat.
  * @param img_out    Output image buffer, written through xf::cv::xfMat2Array.
  * @param rows       Row count used to construct the intermediate Mats.
  * @param cols       Column count used to construct the intermediate Mats.
  * @param sTxMatrix  Stream of transform coefficients; consumed only when non-empty.
  */
 void warp_transformAccelMem(membus_t* img_inp,

                             membus_t* img_out,

                             // membus_t* img_out2,

                             int rows, int cols,

                             // float transform_mat[TRANSFORM_MATRIX_DIM]

                             hls::stream<float> &sTxMatrix

                             ) {

     // clang-format on

     #pragma  HLS INLINE off


     // Intermediate image holding the pixels loaded from img_inp.
     xf::cv::Mat<TYPE, HEIGHT, WIDTH, NPIX> imgInput(rows, cols);

     // clang-format off

     #pragma HLS stream variable=imgInput.data depth=4

     // clang-format on


     // The output Mat is only needed when the real kernel is built.
     #ifndef FAKE_WarpTransform

     xf::cv::Mat<TYPE, HEIGHT, WIDTH, NPIX> imgOutput(rows, cols);

     // clang-format off

     #pragma HLS stream variable=imgOutput.data depth=4

     // clang-format on

     #endif


     // clang-format off

     #pragma HLS DATAFLOW

     // clang-format on


     // Local transform matrix. It is `static`, so its contents persist across
     // calls; setUpTxMatrixFromStream only overwrites it when sTxMatrix is
     // non-empty, otherwise the previously stored coefficients are reused.
     // NOTE(review): before the first matrix is received the array holds its
     // zero-initialized static value - confirm that is the intended default.

     static float transform_matrix[TRANSFORM_MATRIX_DIM];


     //prepare the tx matrix

     setUpTxMatrixFromStream(transform_matrix,sTxMatrix );


     // Feed a cv matrix from ddr memory
     // NOTE(review): instantiated with XF_8UC1 while imgInput is declared with
     // TYPE - presumably these are the same value; confirm.

     xf::cv::Array2xfMat<MEMDW_512, XF_8UC1, HEIGHT, WIDTH, NPIX>(img_inp, imgInput);


     #ifdef FAKE_WarpTransform

     // Feed ddr memory from a cv matrix
     // (fake path: the input image is written back unmodified)

     xf::cv::xfMat2Array<MEMDW_512, XF_8UC1, HEIGHT, WIDTH, NPIX>(imgInput, img_out);

     #else


     // Run xfOpenCV kernel:

     xf::cv::warpTransform<NUM_STORE_ROWS, START_PROC, TRANSFORM_TYPE, INTERPOLATION, TYPE, HEIGHT, WIDTH, NPC1,

                           XF_USE_URAM>(imgInput, imgOutput, transform_matrix);


     // Feed ddr memory from a cv matrix

     xf::cv::xfMat2Array<MEMDW_512, XF_8UC1, HEIGHT, WIDTH, NPIX>(imgOutput, img_out);

     #endif


 }


XF_USE_URAM
#define XF_USE_URAM
Definition: xf_config_params.h:41

NPC1
#define NPC1
Definition: xf_gammacorrection_config.h:43

WIDTH
#define WIDTH
Definition: xf_gammacorrection_config.h:64

NPIX
#define NPIX
Definition: xf_gammacorrection_config.h:61

HEIGHT
#define HEIGHT
Definition: xf_gammacorrection_config.h:65

INPUT_PTR_WIDTH
#define INPUT_PTR_WIDTH
Definition: mceuropeanengine.hpp:71

OUTPUT_PTR_WIDTH
#define OUTPUT_PTR_WIDTH
Definition: mceuropeanengine.hpp:75

TYPE
#define TYPE
Definition: xf_median_blur_config.h:89

membus_t
membus_512_t membus_t
Definition: memtest.hpp:92

TRANSFORM_MATRIX_DIM
#define TRANSFORM_MATRIX_DIM
Definition: warp_transform.hpp:80

warp_transformAccelMem
void warp_transformAccelMem(membus_t *img_inp, membus_t *img_out, int rows, int cols, hls::stream< float > &sTxMatrix)
Top-level accelerated function of the WarpTransform Application with memory mapped interfaces.
Definition: xf_warp_transform_accel.cpp:222

setUpTxMatrixFromStream
void setUpTxMatrixFromStream(float transform_matrix[9], hls::stream< float > &sTxMatrix)
Definition: xf_warp_transform_accel.cpp:61

warpTransformAccelStream
void warpTransformAccelStream(hls::stream< ap_uint< 8 >> &img_in_axi_stream, hls::stream< ap_uint< 64 >> &img_out_axi_stream, int rows, int cols, float transform_matrix[9])
Top-level accelerated function of the WarpTransform Application with stream I/F.
Definition: xf_warp_transform_accel.cpp:129

warptTransformAccelArray
void warptTransformAccelArray(ap_uint< 8 > *img_in, float *transform, ap_uint< 64 > *img_out, int rows, int cols)
Top-level accelerated function of the WarpTransform Application with array I/F, used only for simulation.
Definition: xf_warp_transform_accel.cpp:83

TRANSFORM_TYPE
#define TRANSFORM_TYPE
Definition: xf_warp_transform_config.h:77

START_PROC
#define START_PROC
Definition: xf_warp_transform_config.h:72

fakeWarpTransformAccelStream
void fakeWarpTransformAccelStream(hls::stream< ap_axiu< 8, 0, 0, 0 > > &img_in_axi_stream, hls::stream< ap_axiu< 64, 0, 0, 0 > > &img_out_axi_stream, unsigned int min_rx_loops, unsigned int min_tx_loops, float transform_matrix[9])

INTERPOLATION
#define INTERPOLATION
Definition: xf_warp_transform_config.h:74

NUM_STORE_ROWS
#define NUM_STORE_ROWS
Definition: xf_warp_transform_config.h:69

test_harris_standalone.stream
stream
Definition: test_harris_standalone.py:48

test_harris_standalone.rows
rows
Definition: test_harris_standalone.py:167

test_harris_standalone.cols
cols
Definition: test_harris_standalone.py:167