.. _program_listing_file__tmp_ws_src_vitis_common_include_imgproc_xf_accumulate_squared.hpp: Program Listing for File xf_accumulate_squared.hpp ================================================== |exhale_lsh| :ref:`Return to documentation for file ` (``/tmp/ws/src/vitis_common/include/imgproc/xf_accumulate_squared.hpp``) .. |exhale_lsh| unicode:: U+021B0 .. UPWARDS ARROW WITH TIP LEFTWARDS .. code-block:: cpp /* * Copyright 2019 Xilinx, Inc. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #ifndef _XF_ACCUMULATE_SQUARED_HPP_ #define _XF_ACCUMULATE_SQUARED_HPP_ #include "hls_stream.h" #include "../common/xf_common.hpp" #ifndef XF_IN_STEP #define XF_IN_STEP 8 #endif #ifndef XF_OUT_STEP #define XF_OUT_STEP 16 #endif namespace xf { namespace cv { template int AcuumulateSquaredKernel(xf::cv::Mat& src1, xf::cv::Mat& src2, xf::cv::Mat& dst, uint16_t height, uint16_t width) { ap_uint<13> i, j, k, l; // clang-format off #pragma HLS DATAFLOW // clang-format on XF_TNAME(DST_T, NPC) pxl_pack_out; XF_TNAME(SRC_T, NPC) pxl_pack1, pxl_pack2; RowLoop: for (i = 0; i < height; i++) { // clang-format off #pragma HLS LOOP_FLATTEN off #pragma HLS LOOP_TRIPCOUNT min=ROWS max=ROWS // clang-format on ColLoop: for (j = 0; j < width; j++) { // clang-format off #pragma HLS LOOP_TRIPCOUNT min=TC max=TC #pragma HLS pipeline // clang-format on int y; pxl_pack1 = (XF_SNAME(WORDWIDTH_SRC))src1.read(i * width + j); pxl_pack2 = (XF_SNAME(WORDWIDTH_SRC))src2.read(i * width + j); ProcLoop: for (k = 0, l = 0; k < ((8 << XF_BITSHIFT(NPC)) * PLANES); k += XF_IN_STEP, l += XF_OUT_STEP) { // clang-format off #pragma HLS UNROLL // clang-format on XF_CTUNAME(SRC_T, NPC) pxl1 = pxl_pack1.range(k + 7, k); XF_CTUNAME(SRC_T, NPC) pxl2 = pxl_pack2.range(k + 7, k); XF_CTUNAME(DST_T, NPC) t = (pxl1 * pxl1); pxl_pack_out.range(l + XF_OUT_STEP - 1, l) = t + pxl2; } dst.write(i * width + j, (XF_SNAME(WORDWIDTH_DST))pxl_pack_out); } } return 0; } template void accumulateSquare(xf::cv::Mat& src1, xf::cv::Mat& src2, xf::cv::Mat& dst) { #ifndef __SYNTHESIS__ assert(((SRC_T == XF_8UC1) || (SRC_T == XF_8UC3)) && "Input TYPE must be XF_8UC1 for 1-channel and XF_8UC3 for 3-channel image"); assert(((DST_T == XF_16UC1) || (DST_T == XF_16UC3)) && "Output TYPE must be XF_16UC1 for 1-channel and XF_16UC3 for 3-channel image"); assert(((src1.rows == src2.rows) && (src1.cols == src2.cols)) && "Both input images should have same size"); assert(((src1.rows == dst.rows) && (src1.cols == dst.cols)) && "Input and output image should be of same size"); assert(((src1.rows <= ROWS) && (src1.cols <= COLS)) && "ROWS and COLS should be greater than input image"); assert(((NPC == XF_NPPC1) || (NPC == XF_NPPC8)) && "NPC must be XF_NPPC1, XF_NPPC8 "); #endif short width = src1.cols >> XF_BITSHIFT(NPC); // clang-format off #pragma HLS INLINE OFF // clang-format on AcuumulateSquaredKernel> XF_BITSHIFT(NPC))>(src1, src2, dst, src1.rows, width); } } // namespace cv } // namespace xf #endif //_XF_ACCUMULATE_SQUARED_HPP_