This is the WarpTransform accelerated function from Vitis Vision Open Source Library. More...

Collaboration diagram for WarpTransform:

Modules
	WarpTransform Testbench
	This is a subgroup of WarpTransform accelerated function with only testbench-related functions/classes.

	WarpTransform HLS
	This is a subgroup of WarpTransform accelerated function with only synthesizable (HLS) functions/classes.

	WarpTransform Host
	This is a subgroup of WarpTransform accelerated function with only host code software.

Files
file	config.h
	The configuration of a WarpTransform Example application (UDP or TCP)

file	warp_transform_host.cpp
	WarpTransform userspace application for cF (x86, ppc64).

file	xf_warp_transform_config.h
	The WarpTransform configuration header.

Macros
#define	CEIL(a, b) (((a) + (b-1)) / (b))

#define	FRAME_HEIGHT 32

#define	FRAME_WIDTH 32

#define	FRAME_INTERVAL (1000/30)

#define	PACK_SIZE 1024

#define	BUF_LEN 65540

#define	WRITE_OUTPUT_FILE

#define	TB_SIM_CFP_VITIS

#define	INPUT_TYPE_HOST CV_8UC1

#define	NET_TYPE udp

#define	DEBUG_LEVEL dbgLevelNone

#define	FRAME_TOTAL FRAME_HEIGHT * FRAME_WIDTH

#define	WARP_TRANSFORM_TOTAL FRAME_TOTAL + 8 * 2 + 5 * 8

#define	TOT_TRANSFERS CEIL(WARP_TRANSFORM_TOTAL, PACK_SIZE)

#define	tcp 0

#define	udp 1

#define	PY_WRAP_WARPTRANSFORM_NUMPI 0

#define	PY_WRAP_WARPTRANSFORM_FILENAME 1

#define	TRMAT_DIM2 3

#define	TRMAT_DIM1 2

#define	NUM_STORE_ROWS 256

#define	START_PROC 200

#define	INTERPOLATION 0

#define	TRANSFORM_TYPE 0

#define	XF_USE_URAM false

#define	NPC1 XF_NPPC1

#define	PTR_WIDTH 128

#define	TYPE XF_8UC1

#define	CH_TYPE XF_GRAY

#define	INPUT_PTR_WIDTH 8

#define	OUTPUT_PTR_WIDTH 64

#define	NPIX XF_NPPC1

#define	WIDTH FRAME_WIDTH

#define	HEIGHT FRAME_HEIGHT

#define	IMGSIZE FRAME_TOTAL

#define	BITS_PER_10GBITETHRNET_AXI_PACKET 64

#define	BYTES_PER_10GBITETHRNET_AXI_PACKET (BITS_PER_10GBITETHRNET_AXI_PACKET/8)

#define	IMG_PACKETS IMGSIZE/(BYTES_PER_10GBITETHRNET_AXI_PACKET)

#define	MIN_RX_LOOPS IMG_PACKETS*(BITS_PER_10GBITETHRNET_AXI_PACKET/INPUT_PTR_WIDTH)

#define	MIN_TX_LOOPS IMG_PACKETS*(BITS_PER_10GBITETHRNET_AXI_PACKET/OUTPUT_PTR_WIDTH)

#define	OUT_TYPE TYPE

Functions
void	delay (unsigned int mseconds)

void	print_cFpZoo (void)

void	resizeCropSquare (const cv::Mat &input, const cv::Mat &output, const cv::Size &dstSize, int interpolation=INTER_LINEAR)
	Resize an image and crop if necessary in order to keep a rectangle area in the middle of the image. More...

string	prepareWarpTransformCommand (unsigned int rows, unsigned int cols, unsigned int channels, float *transform_matrix)

int	main (int argc, char *argv[])

void	warptTransformAccelArray (ap_uint< 8 > img_in, float transform, ap_uint< 64 > *img_out, int rows, int cols)
	Top-level accelerated function of the WarpTransform Application with array I/F used only for simulation/TB purposes. More...

void	warpTransformAccelStream (hls::stream< ap_uint< 8 >> &img_in_axi_stream, hls::stream< ap_uint< 64 >> &img_out_axi_stream, int rows, int cols, float transform_matrix[9])
	Top-level accelerated function of the WarpTransform Application with stream I/F. More...

void	fakeWarpTransformAccelStream (hls::stream< ap_axiu< 8, 0, 0, 0 > > &img_in_axi_stream, hls::stream< ap_axiu< 64, 0, 0, 0 > > &img_out_axi_stream, unsigned int min_rx_loops, unsigned int min_tx_loops, float transform_matrix[9])

void	warp_transformAccelMem (membus_t *img_inp, membus_t *img_out, int rows, int cols, hls::stream< float > &sTxMatrix)
	Top-level accelerated function of the WarpTransform Application with memory mapped interfaces. More...

Detailed Description

This is the WarpTransform accelerated function from Vitis Vision Open Source Library.

Macro Definition Documentation

◆ BITS_PER_10GBITETHRNET_AXI_PACKET

#define BITS_PER_10GBITETHRNET_AXI_PACKET 64

Definition at line 121 of file xf_warp_transform_config.h.

◆ BUF_LEN

#define BUF_LEN 65540

Larger than maximum UDP packet size

Definition at line 55 of file config.h.

◆ BYTES_PER_10GBITETHRNET_AXI_PACKET

#define BYTES_PER_10GBITETHRNET_AXI_PACKET (BITS_PER_10GBITETHRNET_AXI_PACKET/8)

Definition at line 122 of file xf_warp_transform_config.h.

◆ CEIL

#define CEIL	(	a,
		b
	)	(((a) + (b-1)) / (b))

Ceiling function without using math.h

Definition at line 37 of file config.h.

◆ CH_TYPE

#define CH_TYPE XF_GRAY

Definition at line 102 of file xf_warp_transform_config.h.

◆ DEBUG_LEVEL

#define DEBUG_LEVEL dbgLevelNone

The level of debugging: 0 -> None, 1 -> Light Debug, 2 -> Medium Debug, 3 -> Insane Debug

Definition at line 78 of file config.h.

◆ FRAME_HEIGHT

#define FRAME_HEIGHT 32

The maximum height of the frame in pixels (from 6x6 to 256x256 for debugging)

Definition at line 43 of file config.h.

◆ FRAME_INTERVAL

#define FRAME_INTERVAL (1000/30)

Definition at line 48 of file config.h.

◆ FRAME_TOTAL

#define FRAME_TOTAL FRAME_HEIGHT * FRAME_WIDTH

Definition at line 82 of file config.h.

◆ FRAME_WIDTH

#define FRAME_WIDTH 32

The maximum width of the frame in pixels

Definition at line 46 of file config.h.

◆ HEIGHT

#define HEIGHT FRAME_HEIGHT

Definition at line 117 of file xf_warp_transform_config.h.

◆ IMG_PACKETS

#define IMG_PACKETS IMGSIZE/(BYTES_PER_10GBITETHRNET_AXI_PACKET)

Definition at line 124 of file xf_warp_transform_config.h.

◆ IMGSIZE

#define IMGSIZE FRAME_TOTAL

Definition at line 119 of file xf_warp_transform_config.h.

◆ INPUT_PTR_WIDTH

#define INPUT_PTR_WIDTH 8

Definition at line 103 of file xf_warp_transform_config.h.

◆ INPUT_TYPE_HOST

#define INPUT_TYPE_HOST CV_8UC1

Keep it uncommented if you want the input to be from camera frames; otherwise, for images, comment it. The OpenCV type for the input image. TODO: We have to automatically fix it for every kernel

Definition at line 70 of file config.h.

◆ INTERPOLATION

#define INTERPOLATION 0

Definition at line 74 of file xf_warp_transform_config.h.

◆ MIN_RX_LOOPS

#define MIN_RX_LOOPS IMG_PACKETS*(BITS_PER_10GBITETHRNET_AXI_PACKET/INPUT_PTR_WIDTH)

Definition at line 126 of file xf_warp_transform_config.h.

◆ MIN_TX_LOOPS

#define MIN_TX_LOOPS IMG_PACKETS*(BITS_PER_10GBITETHRNET_AXI_PACKET/OUTPUT_PTR_WIDTH)

Definition at line 127 of file xf_warp_transform_config.h.

◆ NET_TYPE

#define NET_TYPE udp

The network socket type: tcp or udp

Definition at line 73 of file config.h.

◆ NPC1

#define NPC1 XF_NPPC1

Definition at line 82 of file xf_warp_transform_config.h.

◆ NPIX

#define NPIX XF_NPPC1

Definition at line 113 of file xf_warp_transform_config.h.

◆ NUM_STORE_ROWS

#define NUM_STORE_ROWS 256

Definition at line 69 of file xf_warp_transform_config.h.

◆ OUT_TYPE

#define OUT_TYPE TYPE

Definition at line 130 of file xf_warp_transform_config.h.

◆ OUTPUT_PTR_WIDTH

#define OUTPUT_PTR_WIDTH 64

Definition at line 104 of file xf_warp_transform_config.h.

◆ PACK_SIZE

#define PACK_SIZE 1024

This is our custom MTU. We must use a multiple of 8 (Bytes per transaction)! 1450 4086 udp pack size; note that OSX limits < 8100 bytes

Definition at line 52 of file config.h.

◆ PTR_WIDTH

#define PTR_WIDTH 128

Definition at line 83 of file xf_warp_transform_config.h.

◆ PY_WRAP_WARPTRANSFORM_FILENAME

#define PY_WRAP_WARPTRANSFORM_FILENAME 1

Definition at line 92 of file config.h.

◆ PY_WRAP_WARPTRANSFORM_NUMPI

#define PY_WRAP_WARPTRANSFORM_NUMPI 0

Definition at line 91 of file config.h.

◆ START_PROC

#define START_PROC 200

Definition at line 72 of file xf_warp_transform_config.h.

◆ TB_SIM_CFP_VITIS

#define TB_SIM_CFP_VITIS

If defined, images will be shown in pop-up windows
For HOST TB uncomment this. For normal host execution keep it commented

Definition at line 64 of file config.h.

◆ tcp

#define tcp 0

Definition at line 88 of file config.h.

◆ TOT_TRANSFERS

#define TOT_TRANSFERS CEIL(WARP_TRANSFORM_TOTAL, PACK_SIZE)

The total TxRx transfers for a predefined MTU=PACK_SIZE

Definition at line 86 of file config.h.

◆ TRANSFORM_TYPE

#define TRANSFORM_TYPE 0

Definition at line 77 of file xf_warp_transform_config.h.

◆ TRMAT_DIM1

#define TRMAT_DIM1 2

Definition at line 48 of file warp_transform_host.cpp.

◆ TRMAT_DIM2

#define TRMAT_DIM2 3

Definition at line 47 of file warp_transform_host.cpp.

◆ TYPE

#define TYPE XF_8UC1

Definition at line 97 of file xf_warp_transform_config.h.

◆ udp

#define udp 1

Definition at line 89 of file config.h.

◆ WARP_TRANSFORM_TOTAL

#define WARP_TRANSFORM_TOTAL FRAME_TOTAL + 8 * 2 + 5 * 8

Definition at line 83 of file config.h.

◆ WIDTH

#define WIDTH FRAME_WIDTH

Definition at line 116 of file xf_warp_transform_config.h.

◆ WRITE_OUTPUT_FILE

#define WRITE_OUTPUT_FILE

If defined, output images will be written

Definition at line 58 of file config.h.

◆ XF_USE_URAM

#define XF_USE_URAM false

Definition at line 78 of file xf_warp_transform_config.h.

Function Documentation

◆ delay()

void delay ( unsigned int mseconds )

Definition at line 60 of file warp_transform_host.cpp.

 {
     clock_t goal = mseconds + clock();
     while (goal > clock());
 }

Here is the call graph for this function:

◆ fakeWarpTransformAccelStream()

void fakeWarpTransformAccelStream	(	hls::stream< ap_axiu< 8, 0, 0, 0 > > &	img_in_axi_stream,
		hls::stream< ap_axiu< 64, 0, 0, 0 > > &	img_out_axi_stream,
		unsigned int	min_rx_loops,
		unsigned int	min_tx_loops,
		float	transform_matrix[9]
	)

Here is the caller graph for this function:

◆ main()

int main	(	int	argc,
		char *	argv[]
	)

Main testbench and user-application for WarpTransform on host. Client

Returns: 0 on success, 1 on fail

Definition at line 164 of file warp_transform_host.cpp.

                                   {
     if ((argc < 3) || (argc > 4)) { // Test for correct number of arguments
         cerr << "Usage: " << argv[0] << " <Server> <Server Port> <optional input image>\n";
         exit(1);
     }
 #endif // PY_WRAP
  
     //------------------------------------------------------
     //-- STEP-1 : Socket and variables definition
     //------------------------------------------------------
     
     #ifndef PY_WRAP
     assert ((argc == 3) || (argc == 4));
     string s_servAddress = argv[1]; // First arg: server address
     char *s_servPort = argv[2];
     #endif
  
     string servAddress = s_servAddress;
     unsigned short servPort;
     bool net_type = NET_TYPE;
     if (net_type == udp) {
     servPort = Socket::resolveService(s_servPort, "udp");
     }
     else if (net_type == tcp) {
     servPort = atoi(s_servPort);
     }
     else {
     cout << "ERROR: Invalid type of socket type provided: " << net_type  << " Choosed one of (tcp=0 or udp=1)" << endl;
     }    
     
     unsigned char buffer[BUF_LEN]; // Buffer for echo string
     unsigned int recvMsgSize; // Size of received message
     string input_string;
 #ifdef INPUT_FROM_CAMERA
     int input_num;
 #ifdef PY_WRAP
 #if PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME
     input_num = atoi(input_str);
     input_string = "./cam"+to_string(input_num);
 #endif // PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME
 #else // !PY_WRAP
     if (argc == 3) {
         input_num = 0;
     }
     else if (argc == 4) {
         input_num = atoi(argv[3]);
     }
     input_string = "./cam"+to_string(input_num);
 #endif // PY_WRAP    
 #else // !INPUT_FROM_CAMERA
 #ifdef PY_WRAP
 #if PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME
     input_string.assign(input_str);
 #endif // PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME    
 #else // !PY_WRAP
     if (argc == 3) {
         // Give a default image
         input_string.assign("../../../../../../ROLE/vision/hls/warp_transform/test/8x8.png");
     }
     else if (argc == 4) {
         input_string.assign(argv[3]);
     }
 #endif // PY_WRAP
 #endif // INPUT_FROM_CAMERA
     
    
 #if !defined(PY_WRAP) || (PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME)
    
     // ksize: aperture linear size; it must be odd and greater than 1, for example: 3, 5, 7 ...
     // int ksize = WINDOW_SIZE ;
     // float identity_tx_mat [9] = {1,0,0,0,1,0,0,0,0};
     // float xtranslation_tx_mat [9] = {1,0,2,0,1,0,0,0,0};// 1 0 vx 0 1 vy 000
     // float ytranslation_tx_mat [9] = {1,0,0,0,1,2,0,0,0}; 
     // float reflection_tx_mat [9] = {-1,0,0,0,1,0,0,0,0};
     // float yscale_tx_mat [9] = {2,0,0,0,1,0,0,0,0}; //cx  0 0 0 cy 0 000
     // float xscale_tx_mat [9] = {1,0,0,0,2,0,0,0,0};
     // float rotation_30degree_tx_mat [9] = {0.87,-0.5,0,0.5,0.87,0,0,0,0}; //cos -sin 0 sin cos 0 000
     // float shearing_tx_mat [9] = {1,0.5,0,0,1,0,0,0,0}; //1 cx 0 cy 1 0 000
     float transformation_matrix_float [9] = {1.5,0,0,0,1.8,0,0,0,0};
     cv::Mat transformation_matrix(TRMAT_DIM1, TRMAT_DIM2, CV_32FC1, transformation_matrix_float);
     string out_img_file;
     string out_video_file;
     // Define the codec and create VideoWriter object.The output is stored in 'outcpp.avi' file. 
     //#ifdef PY_WRAP
     //out_video_file.assign(output_str);
     //#else // !PY_WRAP
     out_video_file.assign(input_string);
     out_video_file += "_fpga_video_out.avi";
     //#endif // PY_WRAP
 #if CV_MAJOR_VERSION < 4
     VideoWriter video(out_video_file,CV_FOURCC('M','J','P','G'),10, Size(FRAME_WIDTH,FRAME_HEIGHT));
 #else
     VideoWriter video(out_video_file,cv::VideoWriter::fourcc('M','J','P','G'),10, Size(FRAME_WIDTH,FRAME_HEIGHT));
 #endif
  
 #endif // #if !defined(PY_WRAP) || (PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME) 
  
     print_cFpZoo();
     
     try {
           
         //------------------------------------------------------
         //-- STEP-2 : Initialize socket connection
         //------------------------------------------------------      
 #if NET_TYPE == udp
 #ifndef TB_SIM_CFP_VITIS
             UDPSocket sock(servPort); // NOTE: It is very important to set port here in order to call 
                                       // bind() in the UDPSocket constructor
 #else // TB_SIM_CFP_VITIS
             UDPSocket sock; // NOTE: In HOST TB the port is already binded by warp_transform_host_fwd_tb.cpp
 #endif // TB_SIM_CFP_VITIS
 #else // tcp
             TCPSocket sock(servAddress, servPort);
 #endif // udp/tcp
  
  
 #if !defined(PY_WRAP) || (PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME)
  
  
             //------------------------------------------------------------------------------------
             //-- STEP-3 : Initialize a Greyscale OpenCV Mat either from image or from video/camera
             //------------------------------------------------------------------------------------
             Mat frame, send(FRAME_WIDTH, FRAME_HEIGHT, INPUT_TYPE_HOST, Scalar(0)), ocv_out_img;
             vector < uchar > encoded;
  
 #ifdef INPUT_FROM_CAMERA
  
         VideoCapture cap(input_num); // Grab the camera
         if (!cap.isOpened()) {
             cerr << "OpenCV Failed to open camera " + input_num << endl;
             exit(1);
         }
         
 #else // INPUT_FROM_CAMERA
  
         VideoCapture cap(input_string); // Grab the image
         if (!cap.isOpened()) {
             cerr << "OpenCV Failed to open file " + input_string << endl;
             exit(1);
         }
         
 #endif // INPUT_FROM_CAMERA
         std::string warptx_cmd = prepareWarpTransformCommand(FRAME_WIDTH, FRAME_HEIGHT, send.channels(), transformation_matrix_float);
         
         //frame = cv::imread(argv[3], cv::IMREAD_GRAYSCALE); // reading in the image in grey scale
         unsigned int num_frame = 0;
  
         while (1) {
             clock_t start_cycle_main = clock();
             cap >> frame;
             if (frame.empty()) break; // if input is an image, the loop will be executed once
             if(frame.size().width==0) continue; //simple integrity check; skip erroneous data...
             cout << " ___________________________________________________________________ " << endl;
             cout << "/                                                                   \\" << endl;
             cout << "INFO: Frame # " << ++num_frame << endl;
 #if CV_MAJOR_VERSION < 4
             cv::cvtColor(frame,frame,CV_BGR2GRAY);
 #else
             cv::cvtColor(frame,frame,cv::COLOR_BGR2GRAY);
 #endif
             resizeCropSquare(frame, send, Size(FRAME_WIDTH, FRAME_HEIGHT), INTER_LINEAR);
             if ((frame.cols != FRAME_WIDTH) || (frame.rows != FRAME_HEIGHT)) {
                 cout << "WARNING: Input frame was resized from " << frame.cols << "x" 
                         << frame.rows << " to " << send.cols << "x" << send.rows << endl;
             }
                 imwrite("testimg.png", frame);
  
             assert(send.total() == FRAME_WIDTH * FRAME_HEIGHT);
             // Ensure that the selection of MTU is a multiple of 8 (Bytes per transaction)
             assert(PACK_SIZE % 8 == 0);
  
 #ifdef SHOW_WINDOWS     
             namedWindow("host_send", CV_WINDOW_NORMAL);
             imshow("host_send", send);
  
 #endif // SHOW_WINDOWS
     
             // Ensure that the send Mat is in continuous memory space. Typically, imread or resize 
             // will return such a continuous Mat, but we should check it.
             assert(send.isContinuous());
  
             unsigned int send_total = send.total();
             unsigned int send_channels = send.channels();
             unsigned int warptx_cmd_size = warptx_cmd.length();
 #else // PY_WRAP == PY_WRAP_WARPTRANSFORM_NUMPI
             unsigned int send_total = (unsigned int)total_size +  warptx_cmd_size; //TBC!!!!!!!!!!!!!!!!!
             unsigned int send_channels = 1; // FIXME: It is ok only for 1-d array, i.e. CV_8UC1
             unsigned char * sendarr = input_img;
 #endif // #if !defined(PY_WRAP) || (PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME)
  
             unsigned int total_pack  = 1 + (send_total * send_channels - 1 +  warptx_cmd_size) / PACK_SIZE;
             unsigned int total_bytes = total_pack * PACK_SIZE;
             unsigned int bytes_in_last_pack = send_total * send_channels +  warptx_cmd_size - (total_pack - 1) * PACK_SIZE;
             assert(total_pack == TOT_TRANSFERS);
  
             unsigned int total_pack_rx  = 1 + (send_total * send_channels - 1) / PACK_SIZE;
             unsigned int total_bytes_rx = total_pack_rx * PACK_SIZE;
             unsigned int bytes_in_last_pack_rx = send_total * send_channels - (total_pack_rx- 1) * PACK_SIZE;
  
             //unsigned char * longbuf = new unsigned char[PACK_SIZE * total_pack];
         unsigned char * longbuf = (unsigned char *) malloc (PACK_SIZE * total_pack_rx * sizeof (unsigned char));
  
             cout << "INFO: FPGA destination : " << servAddress << ":" << servPort << endl;
             cout << "INFO: Network socket   : " << ((NET_TYPE == tcp) ? "TCP" : "UDP") << endl;
             cout << "INFO: Total packets to send= " << total_pack << endl;
             cout << "INFO: Total packets to receive = " << total_pack_rx << endl;
             cout << "INFO: Total bytes to send   = " << send_total * send_channels +  warptx_cmd_size << endl;
             cout << "INFO: Total bytes to receive   = " << send_total * send_channels << endl;
             cout << "INFO: Total bytes in " << total_pack << " packets = "  << total_bytes << endl;
             cout << "INFO: Total bytes in " << total_pack_rx << " packets = "  << total_bytes_rx << endl;
             cout << "INFO: Bytes in last packet          = " << bytes_in_last_pack << endl;
             cout << "INFO: Bytes in last packet to receive    = " << bytes_in_last_pack_rx << endl;
             cout << "INFO: Packet size (custom MTU)      = " << PACK_SIZE << endl;
  
 #if !defined(PY_WRAP) || (PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME)
         
             //--------------------------------------------------------
             //-- STEP-4 : RUN WARPTRANSFORM DETECTOR FROM OpenCV LIBRARY (SW)
             //--------------------------------------------------------
             clock_t start_cycle_warp_transform_sw = clock();
             ocv_out_img.create(send.rows, send.cols, INPUT_TYPE_HOST); // create memory for opencv output image
             ocv_ref(send, ocv_out_img, transformation_matrix);
             clock_t end_cycle_warp_transform_sw = clock();
             double duration_warp_transform_sw = (end_cycle_warp_transform_sw - start_cycle_warp_transform_sw) / 
                                             (double) CLOCKS_PER_SEC;
             cout << "INFO: SW exec. time:" << duration_warp_transform_sw << " seconds" << endl;
             cout << "INFO: Effective FPS SW:" << (1 / duration_warp_transform_sw) << " \tkbps:" << 
                     (PACK_SIZE * total_pack / duration_warp_transform_sw / 1024 * 8) << endl;
  
             //------------------------------------------------------
             //-- STEP-5 : RUN WARPTRANSFORM DETECTOR FROM cF (HW)
             //------------------------------------------------------
     
             //------------------------------------------------------
             //-- STEP-5.1 : Preparation
             //------------------------------------------------------
  
             // Anchor a pointer on cvMat raw data
             unsigned char * sendarr_img = send.isContinuous()? send.data: send.clone().data;
             // unsigned char * sendarr = send.isContinuous()? send.data: send.clone().data;
             // warptx_cmd = warptx_cmd.append(sendarr_img, send_total * send_channels);
             unsigned char * sendarr = (unsigned char *) malloc (send_total * send_channels +  warptx_cmd_size);
             memcpy(sendarr,warptx_cmd.c_str(), warptx_cmd_size);
             memcpy(sendarr+warptx_cmd_size,sendarr_img, send_total * send_channels);
             
 #endif // !defined(PY_WRAP) || (PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME)
     
             clock_t start_cycle_warp_transform_hw = clock();
  
             //------------------------------------------------------
             //-- STEP-5.2 : TX Loop
             //------------------------------------------------------
             clock_t last_cycle_tx = clock();
             unsigned int sending_now = PACK_SIZE;
             for (unsigned int i = 0; i < total_pack; i++) {
                 if ( i == total_pack - 1 ) {
                     sending_now = bytes_in_last_pack;
                 }
                 #if NET_TYPE == udp
                 sock.sendTo( & sendarr[i * PACK_SIZE], sending_now, servAddress, servPort);
                 #else
                 sock.send( & sendarr[i * PACK_SIZE], sending_now);
                 #endif
                 //delay(500);  
             }
             
             clock_t next_cycle_tx = clock();
             double duration_tx = (next_cycle_tx - last_cycle_tx) / (double) CLOCKS_PER_SEC;
             cout << "INFO: Effective FPS TX:" << (1 / duration_tx) << " \tkbps:" << (PACK_SIZE * 
                  total_pack / duration_tx / 1024 * 8) << endl;
             last_cycle_tx = next_cycle_tx;
         
         
             //------------------------------------------------------
             //-- STEP-5.3 : RX Loop
             //------------------------------------------------------    
             clock_t last_cycle_rx = clock();
             unsigned int receiving_now = PACK_SIZE;
             cout << "INFO: Expecting length of packs:" << total_pack_rx << " from " <<  servAddress << ":" << servPort << endl;
             //unsigned char * longbuf = new unsigned char[PACK_SIZE * total_pack];
             unsigned int loopi=0;
             for (unsigned int i = 0; i < send_total; ) {
                 //cout << "DEBUG: i=" << i << ", loopi=" << loopi++ << endl;
                 //if ( i == total_pack - 1 ) {
                 //    receiving_now = bytes_in_last_pack;
                 //}
                 #if NET_TYPE == udp                
                 recvMsgSize = sock.recvFrom(buffer, BUF_LEN, servAddress, servPort);
                 #else
                 recvMsgSize = sock.recv(buffer, BUF_LEN);
                 #endif
                 if (recvMsgSize != receiving_now) {
                     cerr << "WARNING: at i=" << i << " received unexpected size pack:" << recvMsgSize << ". Expected: " << 
                             receiving_now << endl;
                     //continue;
                 }
                 memcpy( & longbuf[i], buffer, recvMsgSize);
                 //cout << "DEBUG: i=" << i << " recvMsgSize=" << recvMsgSize << endl;
                 i += recvMsgSize;
                 //delay(500);
             }
             cout << "INFO: Received packet from " << servAddress << ":" << servPort << endl;
  
             clock_t next_cycle_rx = clock();
             double duration_rx = (next_cycle_rx - last_cycle_rx) / (double) CLOCKS_PER_SEC;
             cout << "INFO: Effective FPS RX:" << (1 / duration_rx) << " \tkbps:" << (PACK_SIZE * 
                     total_pack_rx / duration_rx / 1024 * 8) << endl;
             last_cycle_rx = next_cycle_rx;
  
             clock_t end_cycle_warp_transform_hw = next_cycle_rx;
  
             double duration_warp_transform_hw = (end_cycle_warp_transform_hw - start_cycle_warp_transform_hw) / 
                                                 (double) CLOCKS_PER_SEC;
             cout << "INFO: HW exec. time:" << duration_warp_transform_hw << " seconds" << endl;
             cout << "INFO: Effective FPS HW:" << (1 / duration_warp_transform_hw) << " \tkbps:" << 
                     (PACK_SIZE * total_pack / duration_warp_transform_hw / 1024 * 8) << endl;
                     
 #if !defined(PY_WRAP) || (PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME)
  
             frame = cv::Mat(FRAME_HEIGHT, FRAME_WIDTH, INPUT_TYPE_HOST, longbuf); // OR vec.data() instead of ptr
             if (frame.size().width == 0) {
                 cerr << "receive failure!" << endl;
                 continue;
             }
 #ifdef SHOW_WINDOWS            
             namedWindow("host_recv", CV_WINDOW_NORMAL);
             imshow("host_recv", frame);
 #endif
  
             //------------------------------------------------------
             //-- STEP-6 : Write output files and show in windows
             //------------------------------------------------------
  
             ostringstream oss;
 //            oss << "cFp_Vitis E2E:" << "INFO: Effective FPS HW:" << (1 / duration_warp_transform_hw) << 
 //                   " \tkbps:" << (PACK_SIZE * total_pack / duration_warp_transform_hw / 1024 * 8);
             string windowName = "cFp_Vitis End2End"; //oss.str();
  
             //moveWindow(windowName, 0, 0);
 #ifdef WRITE_OUTPUT_FILE
             if (num_frame == 1) {
                 out_img_file.assign(input_string);
                 out_img_file += "_fpga_image_out_frame_" + to_string(num_frame) + ".png";
 #if defined(PY_WRAP) && (PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME)
  
                 if (!strcpy(output_img_str, &out_img_file[0])) {
                     cerr << "ERROR: Cannot write to output image string." << endl;
                 }
 #endif // defined(PY_WRAP) && (PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME)
                 cout << "INFO: The output image file is stored at : " << out_img_file << endl; 
                 // We save the image received from network after being processed by WarpTransform HW or HOST TB
                 imwrite(out_img_file, frame);
             }
             else if (num_frame > 1) {
                 // If the frame is empty, break immediately
                 if (frame.empty()) {
                     break;
                 }
                 cout << "INFO: The output video file is stored at  : " << out_video_file << endl;
                 Mat tovideo;
                 if (frame.channels() != 1) {
                     tovideo = frame;
                 }
                 else {
                     cvtColor(frame, tovideo, COLOR_GRAY2BGR);        
                 }
                 video.write(tovideo);
             }
 #endif // WRITE_OUTPUT_FILE
             waitKey(FRAME_INTERVAL);
             double duration_main = (clock() - start_cycle_main) / (double) CLOCKS_PER_SEC;
             cout << "INFO: Effective FPS E2E:" << (1 / duration_main) << endl;
             cout << "\\___________________________________________________________________/" << endl
             << endl;
             //delete(longbuf);
         free (longbuf);
         } // while loop
     
         // When everything done, release the video capture and write object
         cap.release();
         video.release();
  
         // Closes all the windows
         destroyAllWindows();
  
 #else  // !defined(PY_WRAP) || (PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME)
         //output_img = longbuf;
         memcpy( output_img, longbuf, total_size);
     free(longbuf);
 #endif // !defined(PY_WRAP) || (PY_WRAP == PY_WRAP_WARPTRANSFORM_FILENAME)
  
         // Destructor closes the socket
     } catch (SocketException & e) {
         cerr << e.what() << endl;
         exit(1);
     }
     
 #ifndef PY_WRAP
     return 0;
 #endif
 }

◆ prepareWarpTransformCommand()

string prepareWarpTransformCommand	(	unsigned int	rows,
		unsigned int	cols,
		unsigned int	channels,
		float *	transform_matrix
	)

Definition at line 103 of file warp_transform_host.cpp.

                                                                                                                         {
     string out;
     unsigned int bytes_per_line = 8;
     char tx_cmd [bytes_per_line];
     char img_cmd [bytes_per_line];
     char value_cmd[bytes_per_line];
  
     //init tx and img cmd
     for (unsigned int k = 0; k < bytes_per_line; k++) {
        value_cmd[k]    = (char)0;
         if (k != 0) {
             tx_cmd[k] = (char)0;
             img_cmd[k] = (char)0;
         }
         else {
             tx_cmd[k] = (char)1; 
             img_cmd[k] = (char)2;
         }
      }
     out = out.append(tx_cmd,bytes_per_line);
  
     //dump the even elements of the tx matrix
     int off = 4;
     for (int i = 0; i < 8; i++)
     {
         memcpy(value_cmd+off, (float*)transform_matrix+i, 4);
         off += 4;
         off = off % bytes_per_line;
         if (i%2 && i!=0)
         {
             //dump matrix
             out = out.append(value_cmd,bytes_per_line);
         }
     }
     //dump last value
     unsigned int zero_constant = 0;
     memcpy(value_cmd, (char*)transform_matrix+8, 4);
     memcpy(value_cmd, (char*)&zero_constant, 4);
     out = out.append(value_cmd,bytes_per_line);
     //creating img mat cmd
     memcpy(img_cmd+6, (char*)&rows, 2);
     memcpy(img_cmd+4, (char*)&cols, 2);
     img_cmd[1]=channels;
     out = out.append(img_cmd,bytes_per_line);
     return string(out);
 }

◆ print_cFpZoo()

void print_cFpZoo ( void )

Definition at line 66 of file warp_transform_host.cpp.

 {
         cout <<  "                                                          " << endl;
     cout <<  "...build with:                                            " << endl;
     cout <<  " ██████╗███████╗██████╗    ███████╗ ██████╗  ██████╗      " << endl;
     cout <<  "██╔════╝██╔════╝██╔══██╗   ╚══███╔╝██╔═══██╗██╔═══██╗     " << endl;
     cout <<  "██║     █████╗  ██████╔╝     ███╔╝ ██║   ██║██║   ██║     " << endl;
     cout <<  "██║     ██╔══╝  ██╔═══╝     ███╔╝  ██║   ██║██║   ██║     " << endl;
     cout <<  "╚██████╗██║     ██║███████╗███████╗╚██████╔╝╚██████╔╝     " << endl;
     cout <<  " ╚═════╝╚═╝     ╚═╝╚══════╝╚══════╝ ╚═════╝  ╚═════╝      " << endl;
     cout <<  "A cloudFPGA project from IBM ZRL                    v1.0  " << endl;
     cout <<  "Quantitative Finance Monte-Carlo European Pricing Engine  " << endl;
 }

◆ resizeCropSquare()

void resizeCropSquare	(	const cv::Mat &	input,
		const cv::Mat &	output,
		const cv::Size &	dstSize,
		int	interpolation = `INTER_LINEAR`
	)

Resize an image, cropping it first if necessary so that only a centered square area of the image is kept.

Parameters

[in]	input	A reference to the cv::Mat input image
[out]	output	A reference to the cv::Mat output image
[in]	dstSize	A reference to the cv::Size of the output image (width, height)
[in]	interpolation	Enumerator for interpolation algorithm (imgproc.hpp)

Returns: Nothing.

Definition at line 91 of file warp_transform_host.cpp.

 {
     int h = input.rows;
     int w = input.cols;
     int min_size = min(h, w);
     int x = w/2-min_size/2;
     int y = h/2-min_size/2;
     // printf("w=%d, h=%d, min_size=%d, x=%d, y=%d, width=%d, height=%d\n", w, h, min_size, x, y, width, height);
     cv::Mat crop_img = input(Rect(x, y, min_size, min_size));
     resize(crop_img, output, Size(dstSize.width, dstSize.height), 0, 0, interpolation);
 }

◆ warp_transformAccelMem()

void warp_transformAccelMem	(	membus_t *	img_inp,
		membus_t *	img_out,
		int	rows,
		int	cols,
		hls::stream< float > &	sTxMatrix
	)

Top-level accelerated function of the WarpTransform Application with memory mapped interfaces.

Returns: Nothing.

Definition at line 222 of file xf_warp_transform_accel.cpp.

                               {
     // Body overview: read the transform matrix from sTxMatrix, load the input
     // image from img_inp into an xf::cv::Mat, run xf::cv::warpTransform and
     // write the result to img_out. When FAKE_WarpTransform is defined the
     // kernel call is compiled out and the input Mat is written straight back
     // to img_out (pass-through).
     // clang-format on
     #pragma  HLS INLINE off
  
     // Input image container, sized at run time from rows/cols.
     xf::cv::Mat<TYPE, HEIGHT, WIDTH, NPIX> imgInput(rows, cols);
     // clang-format off
     #pragma HLS stream variable=imgInput.data depth=4
     // clang-format on
  
     // The output container only exists when the real kernel is built.
     #ifndef FAKE_WarpTransform
     xf::cv::Mat<TYPE, HEIGHT, WIDTH, NPIX> imgOutput(rows, cols);
     // clang-format off
     #pragma HLS stream variable=imgOutput.data depth=4
     // clang-format on
     #endif
     
     // clang-format off
     #pragma HLS DATAFLOW
     // clang-format on
  
     // Local copy of the transform matrix; it is filled from the sTxMatrix
     // stream below (not from global memory).
     // NOTE(review): declared static, so the storage persists across calls.
     static float transform_matrix[TRANSFORM_MATRIX_DIM];
  
     // Prepare the tx matrix from the incoming stream.
     // NOTE(review): setUpTxMatrixFromStream is defined elsewhere; presumably
     // it drains TRANSFORM_MATRIX_DIM floats from sTxMatrix - confirm.
     setUpTxMatrixFromStream(transform_matrix,sTxMatrix );
   
     // Feed a cv matrix from ddr memory
     xf::cv::Array2xfMat<MEMDW_512, XF_8UC1, HEIGHT, WIDTH, NPIX>(img_inp, imgInput);
     
     #ifdef FAKE_WarpTransform
     // Pass-through build: feed ddr memory directly from the input cv matrix
     xf::cv::xfMat2Array<MEMDW_512, XF_8UC1, HEIGHT, WIDTH, NPIX>(imgInput, img_out);
     #else
     
     // Run xfOpenCV kernel:
     xf::cv::warpTransform<NUM_STORE_ROWS, START_PROC, TRANSFORM_TYPE, INTERPOLATION, TYPE, HEIGHT, WIDTH, NPC1,
                           XF_USE_URAM>(imgInput, imgOutput, transform_matrix);
  
     // Feed ddr memory from the transformed cv matrix
     xf::cv::xfMat2Array<MEMDW_512, XF_8UC1, HEIGHT, WIDTH, NPIX>(imgOutput, img_out);    
     #endif
     
     
 }

Here is the call graph for this function:

Here is the caller graph for this function:

◆ warpTransformAccelStream()

void warpTransformAccelStream	(	hls::stream< ap_uint< 8 >> &	img_in_axi_stream,
		hls::stream< ap_uint< 64 >> &	img_out_axi_stream,
		int	rows,
		int	cols,
		float	transform_matrix[9]
	)

Top-level accelerated function of the WarpTransform Application with stream I/F (todo: add WARPTRANSFORM).

Returns: Nothing.

Definition at line 129 of file xf_warp_transform_accel.cpp.

                                                   {
     // Body overview: convert the incoming hls::stream into an xf::cv::Mat,
     // run xf::cv::warpTransform with the caller-supplied transform_matrix,
     // and convert the resulting Mat back into the outgoing hls::stream.
     // clang-format on
     #pragma  HLS INLINE off
  
     // Input image container, sized at run time from rows/cols.
     xf::cv::Mat<TYPE, HEIGHT, WIDTH, NPIX> imgInput(rows, cols);
     // clang-format off
     #pragma HLS stream variable=imgInput.data depth=2
     // clang-format on
  
     // Output image container with the same dimensions as the input.
     xf::cv::Mat<TYPE, HEIGHT, WIDTH, NPIX> imgOutput(rows, cols);
     // clang-format off
     #pragma HLS stream variable=imgOutput.data depth=2
     // clang-format on
  
     // clang-format off
     #pragma HLS DATAFLOW
     // clang-format on
     //FIXME: not static matrix
     // The matrix now arrives as the transform_matrix parameter; the
     // hard-coded examples below are kept for reference only.
     //float transform_matrix[9]={1.5,0,0,0,1.8,0,0,0,0};
     // float transform_matrix[9]={0.87,-0.5,0,0.5,0.87,0,0,0,1};
  
     // Helper object providing the stream <-> xf::cv::Mat converters.
     accel_utils accel_utils_obj;
     
     // Input column count rounded up to a multiple of NPIX
     // (assumes XF_BITSHIFT(NPIX) is log2(NPIX) - TODO confirm).
     int dstMat_cols_align_npc = ((imgInput.cols + (NPIX - 1)) >> XF_BITSHIFT(NPIX)) << XF_BITSHIFT(NPIX);
  
     // Fill imgInput from the INPUT_PTR_WIDTH-bit wide input stream.
     accel_utils_obj.hlsStrm2xfMat<INPUT_PTR_WIDTH, TYPE, HEIGHT, WIDTH, NPIX, (HEIGHT * WIDTH) / NPIX>(img_in_axi_stream, imgInput, dstMat_cols_align_npc);
     
     // Run xfOpenCV kernel:
     xf::cv::warpTransform<NUM_STORE_ROWS, START_PROC, TRANSFORM_TYPE, INTERPOLATION, TYPE, HEIGHT, WIDTH, NPC1,
                           XF_USE_URAM>(imgInput, imgOutput, transform_matrix);  
     
     // Output column count rounded up to a multiple of NPIX (same formula as above).
     int srcMat_cols_align_npc = ((imgOutput.cols + (NPIX - 1)) >> XF_BITSHIFT(NPIX)) << XF_BITSHIFT(NPIX);
     
     // Drain imgOutput into the OUTPUT_PTR_WIDTH-bit wide output stream.
     accel_utils_obj.xfMat2hlsStrm<OUTPUT_PTR_WIDTH, TYPE, HEIGHT, WIDTH, NPIX, HEIGHT*((WIDTH + NPIX - 1) / NPIX)>(imgOutput, img_out_axi_stream,
                                                                                         srcMat_cols_align_npc);    
 }

Here is the caller graph for this function:

◆ warptTransformAccelArray()

void warptTransformAccelArray	(	ap_uint< 8 > *	img_in,
		float *	transform,
		ap_uint< 64 > *	img_out,
		int	rows,
		int	cols
	)

Top-level accelerated function of the WarpTransform Application with array I/F, used only for simulation/TB purposes.

Returns: Nothing.

Definition at line 83 of file xf_warp_transform_accel.cpp.

                                                                                                                 {   
     // Body overview: copy the 9 transform coefficients into a local array,
     // load img_in into an xf::cv::Mat, run xf::cv::warpTransform and store
     // the result into img_out.
     // NOTE(review): pROWS, pCOLS and pNPC1 are not referenced anywhere in
     // this body - confirm whether they are still needed.
     const int pROWS = HEIGHT;
     const int pCOLS = WIDTH;
     const int pNPC1 = NPIX;
  
     // Input image container, sized at run time from rows/cols.
     xf::cv::Mat<XF_8UC1, HEIGHT, WIDTH, NPIX> imgInput(rows, cols);
 // clang-format off
     #pragma HLS stream variable=imgInput.data depth=2
     // clang-format on
     // Output image container with the same dimensions as the input.
     xf::cv::Mat<XF_8UC1, HEIGHT, WIDTH, NPIX> imgOutput(rows, cols);
 // clang-format off
     #pragma HLS stream variable=imgOutput.data depth=2
 // clang-format on
  
 // clang-format off
     #pragma HLS DATAFLOW
     // clang-format on
  
     // Copy transform data from the caller's array into a local array:
     float transform_matrix[9];
  
     // Element-wise copy of all 9 coefficients.
     for (unsigned int i = 0; i < 9; ++i) {
 // clang-format off
         #pragma HLS PIPELINE
         // clang-format on
         transform_matrix[i] = transform[i];
     }
  
     // Array -> Mat, warp, Mat -> array.
     xf::cv::Array2xfMat<INPUT_PTR_WIDTH, TYPE, HEIGHT, WIDTH, NPC1>(img_in, imgInput);
     xf::cv::warpTransform<NUM_STORE_ROWS, START_PROC, TRANSFORM_TYPE, INTERPOLATION, TYPE, HEIGHT, WIDTH, NPC1,
                           XF_USE_URAM>(imgInput, imgOutput, transform_matrix);  
     xf::cv::xfMat2Array<OUTPUT_PTR_WIDTH, XF_8UC1, HEIGHT, WIDTH, NPIX>(imgOutput, img_out);
 }

Here is the caller graph for this function:

Modules

Files

Macros

Functions

Detailed Description

Macro Definition Documentation

◆ BITS_PER_10GBITETHRNET_AXI_PACKET

◆ BUF_LEN

◆ BYTES_PER_10GBITETHRNET_AXI_PACKET

◆ CEIL

◆ CH_TYPE

◆ DEBUG_LEVEL

◆ FRAME_HEIGHT

◆ FRAME_INTERVAL

◆ FRAME_TOTAL

◆ FRAME_WIDTH

◆ HEIGHT

◆ IMG_PACKETS

◆ IMGSIZE

◆ INPUT_PTR_WIDTH

◆ INPUT_TYPE_HOST

◆ INTERPOLATION

◆ MIN_RX_LOOPS

◆ MIN_TX_LOOPS

◆ NET_TYPE

◆ NPC1

◆ NPIX

◆ NUM_STORE_ROWS

◆ OUT_TYPE

◆ OUTPUT_PTR_WIDTH

◆ PACK_SIZE

◆ PTR_WIDTH

◆ PY_WRAP_WARPTRANSFORM_FILENAME

◆ PY_WRAP_WARPTRANSFORM_NUMPI

◆ START_PROC

◆ TB_SIM_CFP_VITIS

◆ tcp

◆ TOT_TRANSFERS

◆ TRANSFORM_TYPE

◆ TRMAT_DIM1

◆ TRMAT_DIM2

◆ TYPE

◆ udp

◆ WARP_TRANSFORM_TOTAL

◆ WIDTH

◆ WRITE_OUTPUT_FILE

◆ XF_USE_URAM

Function Documentation

◆ delay()

◆ fakeWarpTransformAccelStream()

◆ main()

◆ prepareWarpTransformCommand()

◆ print_cFpZoo()

◆ resizeCropSquare()

◆ warp_transformAccelMem()

◆ warpTransformAccelStream()

◆ warptTransformAccelArray()