!15584 faster_rcnn mask_rcnn mindir 310推理
From: @yuzhenhua666 Reviewed-by: @oacjiewen,@c_34 Signed-off-by: @c_34
This commit is contained in:
commit
196d65c0bd
|
@ -177,7 +177,7 @@ sh run_eval_ascend.sh [VALIDATION_JSON_FILE] [CHECKPOINT_PATH]
|
|||
|
||||
```shell
|
||||
# inference
|
||||
sh run_infer_310.sh [AIR_PATH] [DATA_PATH] [ANN_FILE_PATH]
|
||||
sh run_infer_310.sh [MINDIR_PATH] [DATA_PATH] [ANN_FILE] [DEVICE_ID]
|
||||
```
|
||||
|
||||
# Script Description
|
||||
|
@ -210,7 +210,6 @@ sh run_infer_310.sh [AIR_PATH] [DATA_PATH] [ANN_FILE_PATH]
|
|||
├─resnet50.py // backbone network
|
||||
├─roi_align.py // roi align network
|
||||
└─rpn.py // region proposal network
|
||||
├─aipp.cfg // aipp config file
|
||||
├─config.py // total config
|
||||
├─dataset.py // create dataset and process dataset
|
||||
├─lr_schedule.py // learning ratio generator
|
||||
|
@ -339,7 +338,7 @@ Eval result will be stored in the example path, whose folder name is "eval". Und
|
|||
python export.py --ckpt_file [CKPT_PATH] --device_target [DEVICE_TARGET] --file_format[EXPORT_FORMAT]
|
||||
```
|
||||
|
||||
`EXPORT_FORMAT` should be in ["AIR", "ONNX", "MINDIR"]
|
||||
`EXPORT_FORMAT` should be in ["AIR", "MINDIR"]
|
||||
|
||||
## Inference Process
|
||||
|
||||
|
@ -349,7 +348,7 @@ Before performing inference, the air file must bu exported by export script on t
|
|||
|
||||
```shell
|
||||
# Ascend310 inference
|
||||
sh run_infer_310.sh [AIR_PATH] [DATA_PATH] [ANN_FILE_PATH]
|
||||
sh run_infer_310.sh [MINDIR_PATH] [DATA_PATH] [ANN_FILE] [DEVICE_ID]
|
||||
```
|
||||
|
||||
### result
|
||||
|
|
|
@ -120,7 +120,7 @@ sh run_distribute_train_ascend.sh [RANK_TABLE_FILE] [PRETRAINED_MODEL]
|
|||
sh run_eval_ascend.sh [VALIDATION_JSON_FILE] [CHECKPOINT_PATH]
|
||||
|
||||
#推理
|
||||
sh run_infer_310.sh [AIR_PATH] [DATA_PATH] [ANN_FILE_PATH] [DEVICE_ID]
|
||||
sh run_infer_310.sh [MINDIR_PATH] [DATA_PATH] [ANN_FILE] [DEVICE_ID]
|
||||
```
|
||||
|
||||
## 在GPU上运行
|
||||
|
@ -211,7 +211,6 @@ sh run_infer_310.sh [AIR_PATH] [DATA_PATH] [ANN_FILE_PATH] [DEVICE_ID]
|
|||
├─resnet50.py // 骨干网络
|
||||
├─roi_align.py // ROI对齐网络
|
||||
└─rpn.py // 区域候选网络
|
||||
├─aipp.cfg // aipp 配置文件
|
||||
├─config.py // 总配置
|
||||
├─dataset.py // 创建并处理数据集
|
||||
├─lr_schedule.py // 学习率生成器
|
||||
|
@ -340,7 +339,7 @@ sh run_eval_gpu.sh [VALIDATION_JSON_FILE] [CHECKPOINT_PATH]
|
|||
python export.py --ckpt_file [CKPT_PATH] --device_target [DEVICE_TARGET] --file_format[EXPORT_FORMAT]
|
||||
```
|
||||
|
||||
`EXPORT_FORMAT` 可选 ["AIR", "ONNX", "MINDIR"]
|
||||
`EXPORT_FORMAT` 可选 ["AIR", "MINDIR"]
|
||||
|
||||
## 推理过程
|
||||
|
||||
|
@ -350,7 +349,7 @@ python export.py --ckpt_file [CKPT_PATH] --device_target [DEVICE_TARGET] --file_
|
|||
|
||||
```shell
|
||||
# Ascend310 inference
|
||||
sh run_infer_310.sh [AIR_PATH] [DATA_PATH] [ANN_FILE_PATH] [DEVICE_ID]
|
||||
sh run_infer_310.sh [MINDIR_PATH] [DATA_PATH] [ANN_FILE] [DEVICE_ID]
|
||||
```
|
||||
|
||||
### 结果
|
||||
|
|
|
@ -0,0 +1,14 @@
|
|||
cmake_minimum_required(VERSION 3.14.1)
|
||||
project(Ascend310Infer)
|
||||
add_compile_definitions(_GLIBCXX_USE_CXX11_ABI=0)
|
||||
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -O0 -g -std=c++17 -Werror -Wall -fPIE -Wl,--allow-shlib-undefined")
|
||||
set(PROJECT_SRC_ROOT ${CMAKE_CURRENT_LIST_DIR}/)
|
||||
option(MINDSPORE_PATH "mindspore install path" "")
|
||||
include_directories(${MINDSPORE_PATH})
|
||||
include_directories(${MINDSPORE_PATH}/include)
|
||||
include_directories(${PROJECT_SRC_ROOT})
|
||||
find_library(MS_LIB libmindspore.so ${MINDSPORE_PATH}/lib)
|
||||
file(GLOB_RECURSE MD_LIB ${MINDSPORE_PATH}/_c_dataengine*)
|
||||
|
||||
add_executable(main src/main.cc src/utils.cc)
|
||||
target_link_libraries(main ${MS_LIB} ${MD_LIB} gflags)
|
|
@ -0,0 +1,29 @@
|
|||
#!/bin/bash
|
||||
# Copyright 2021 Huawei Technologies Co., Ltd
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
# ============================================================================
|
||||
if [ -d out ]; then
|
||||
rm -rf out
|
||||
fi
|
||||
|
||||
mkdir out
|
||||
cd out || exit
|
||||
|
||||
if [ -f "Makefile" ]; then
|
||||
make clean
|
||||
fi
|
||||
|
||||
cmake .. \
|
||||
-DMINDSPORE_PATH="`pip3.7 show mindspore-ascend | grep Location | awk '{print $2"/mindspore"}' | xargs realpath`"
|
||||
make
|
|
@ -1,62 +0,0 @@
|
|||
/*
|
||||
* Copyright (c) 2020.Huawei Technologies Co., Ltd. All rights reserved.
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef ACLMANAGER_H
|
||||
#define ACLMANAGER_H
|
||||
|
||||
#include <map>
|
||||
#include <iostream>
|
||||
#include <string>
|
||||
#include <memory>
|
||||
#include <vector>
|
||||
#include "acl/acl.h"
|
||||
#include "CommonDataType.h"
|
||||
#include "ModelProcess.h"
|
||||
#include "DvppCommon.h"
|
||||
|
||||
struct ModelInfo {
|
||||
std::string modelPath;
|
||||
uint32_t modelWidth;
|
||||
uint32_t modelHeight;
|
||||
uint32_t outputNum;
|
||||
};
|
||||
|
||||
class AclProcess {
|
||||
public:
|
||||
AclProcess(int deviceId, const std::string &om_path, uint32_t width, uint32_t height);
|
||||
~AclProcess() {}
|
||||
void Release();
|
||||
int InitResource();
|
||||
int Process(const std::string& imageFile, std::map<double, double> *costTime_map);
|
||||
|
||||
private:
|
||||
int InitModule();
|
||||
int Preprocess(const std::string& imageFile);
|
||||
int ModelInfer(std::map<double, double> *costTime_map);
|
||||
int WriteResult(const std::string& imageFile);
|
||||
int ReadFile(const std::string &filePath, RawData *fileData);
|
||||
|
||||
int32_t deviceId_;
|
||||
ModelInfo modelInfo_;
|
||||
aclrtContext context_;
|
||||
aclrtStream stream_;
|
||||
std::shared_ptr<ModelProcess> modelProcess_;
|
||||
std::shared_ptr<DvppCommon> dvppCommon_;
|
||||
bool keepRatio_;
|
||||
std::vector<void *> outputBuffers_;
|
||||
std::vector<size_t> outputSizes_;
|
||||
};
|
||||
|
||||
#endif
|
|
@ -1,95 +0,0 @@
|
|||
/*
|
||||
* Copyright (c) 2020.Huawei Technologies Co., Ltd. All rights reserved.
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef COMMONDATATYPE_H
|
||||
#define COMMONDATATYPE_H
|
||||
|
||||
#include <stdio.h>
|
||||
#include <iostream>
|
||||
#include <memory>
|
||||
#include <vector>
|
||||
#include "acl/acl.h"
|
||||
#include "acl/ops/acl_dvpp.h"
|
||||
|
||||
#define DVPP_ALIGN_UP(x, align) ((((x) + ((align)-1)) / (align)) * (align))
|
||||
|
||||
#define OK 0
|
||||
#define ERROR -1
|
||||
#define INVALID_POINTER -2
|
||||
#define READ_FILE_FAIL -3
|
||||
#define OPEN_FILE_FAIL -4
|
||||
#define INIT_FAIL -5
|
||||
#define INVALID_PARAM -6
|
||||
#define DECODE_FAIL -7
|
||||
|
||||
const float SEC2MS = 1000.0;
|
||||
const int YUV_BGR_SIZE_CONVERT_3 = 3;
|
||||
const int YUV_BGR_SIZE_CONVERT_2 = 2;
|
||||
const int VPC_WIDTH_ALIGN = 16;
|
||||
const int VPC_HEIGHT_ALIGN = 2;
|
||||
|
||||
// Description of image data
|
||||
struct ImageInfo {
|
||||
uint32_t width; // Image width
|
||||
uint32_t height; // Image height
|
||||
uint32_t lenOfByte; // Size of image data, bytes
|
||||
std::shared_ptr<uint8_t> data; // Smart pointer of image data
|
||||
};
|
||||
|
||||
// Description of data in device
|
||||
struct RawData {
|
||||
size_t lenOfByte; // Size of memory, bytes
|
||||
std::shared_ptr<void> data; // Smart pointer of data
|
||||
};
|
||||
|
||||
// define the structure of an rectangle
|
||||
struct Rectangle {
|
||||
uint32_t leftTopX;
|
||||
uint32_t leftTopY;
|
||||
uint32_t rightBottomX;
|
||||
uint32_t rightBottomY;
|
||||
};
|
||||
|
||||
enum VpcProcessType {
|
||||
VPC_PT_DEFAULT = 0,
|
||||
VPC_PT_PADDING, // Resize with locked ratio and paste on upper left corner
|
||||
VPC_PT_FIT, // Resize with locked ratio and paste on middle location
|
||||
VPC_PT_FILL, // Resize with locked ratio and paste on whole locatin, the input image may be cropped
|
||||
};
|
||||
|
||||
struct DvppDataInfo {
|
||||
uint32_t width = 0; // Width of image
|
||||
uint32_t height = 0; // Height of image
|
||||
uint32_t widthStride = 0; // Width after align up
|
||||
uint32_t heightStride = 0; // Height after align up
|
||||
acldvppPixelFormat format = PIXEL_FORMAT_YUV_SEMIPLANAR_420; // Format of image
|
||||
uint32_t frameId = 0; // Needed by video
|
||||
uint32_t dataSize = 0; // Size of data in byte
|
||||
uint8_t *data = nullptr; // Image data
|
||||
};
|
||||
|
||||
struct CropRoiConfig {
|
||||
uint32_t left;
|
||||
uint32_t right;
|
||||
uint32_t down;
|
||||
uint32_t up;
|
||||
};
|
||||
|
||||
struct DvppCropInputInfo {
|
||||
DvppDataInfo dataInfo;
|
||||
CropRoiConfig roi;
|
||||
};
|
||||
|
||||
#endif
|
|
@ -1,139 +0,0 @@
|
|||
/*
|
||||
* Copyright (c) 2020.Huawei Technologies Co., Ltd. All rights reserved.
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef DVPP_COMMON_H
|
||||
#define DVPP_COMMON_H
|
||||
#include <memory>
|
||||
|
||||
#include "CommonDataType.h"
|
||||
#include "acl/ops/acl_dvpp.h"
|
||||
|
||||
const int MODULUS_NUM_2 = 2;
|
||||
const uint32_t ODD_NUM_1 = 1;
|
||||
|
||||
const uint32_t JPEGD_STRIDE_WIDTH = 128; // Jpegd module output width need to align up to 128
|
||||
const uint32_t JPEGD_STRIDE_HEIGHT = 16; // Jpegd module output height need to align up to 16
|
||||
const uint32_t VPC_STRIDE_WIDTH = 16; // Vpc module output width need to align up to 16
|
||||
const uint32_t VPC_STRIDE_HEIGHT = 2; // Vpc module output height need to align up to 2
|
||||
const uint32_t YUV422_WIDTH_NU = 2; // Width of YUV422, WidthStride = Width * 2
|
||||
const uint32_t YUV444_RGB_WIDTH_NU = 3; // Width of YUV444 and RGB888, WidthStride = Width * 3
|
||||
const uint32_t XRGB_WIDTH_NU = 4; // Width of XRGB8888, WidthStride = Width * 4
|
||||
const uint32_t JPEG_OFFSET = 8; // Offset of input file for jpegd module
|
||||
const uint32_t MAX_JPEGD_WIDTH = 8192; // Max width of jpegd module
|
||||
const uint32_t MAX_JPEGD_HEIGHT = 8192; // Max height of jpegd module
|
||||
const uint32_t MIN_JPEGD_WIDTH = 32; // Min width of jpegd module
|
||||
const uint32_t MIN_JPEGD_HEIGHT = 32; // Min height of jpegd module
|
||||
const uint32_t MAX_RESIZE_WIDTH = 4096; // Max width stride of resize module
|
||||
const uint32_t MAX_RESIZE_HEIGHT = 4096; // Max height stride of resize module
|
||||
const uint32_t MIN_RESIZE_WIDTH = 32; // Min width stride of resize module
|
||||
const uint32_t MIN_RESIZE_HEIGHT = 6; // Min height stride of resize module
|
||||
const float MIN_RESIZE_SCALE = 0.03125; // Min resize scale of resize module
|
||||
const float MAX_RESIZE_SCALE = 16.0; // Min resize scale of resize module
|
||||
const uint32_t MAX_VPC_WIDTH = 4096; // Max width of picture to VPC(resize/crop)
|
||||
const uint32_t MAX_VPC_HEIGHT = 4096; // Max height of picture to VPC(resize/crop)
|
||||
const uint32_t MIN_VPC_WIDTH = 32; // Min width of picture to VPC(resize/crop)
|
||||
const uint32_t MIN_VPC_HEIGHT = 6; // Min height of picture to VPC(resize/crop)
|
||||
const uint32_t MIN_CROP_WIDTH = 10; // Min width of crop area
|
||||
const uint32_t MIN_CROP_HEIGHT = 6; // Min height of crop area
|
||||
const uint8_t YUV_GREYER_VALUE = 128; // Filling value of the resized YUV image
|
||||
|
||||
#define CONVERT_TO_ODD(NUM) (((NUM) % MODULUS_NUM_2 != 0) ? (NUM) : ((NUM) - 1))
|
||||
#define CONVERT_TO_EVEN(NUM) (((NUM) % MODULUS_NUM_2 == 0) ? (NUM) : ((NUM) - 1))
|
||||
#define CHECK_ODD(num) ((num) % MODULUS_NUM_2 != 0)
|
||||
#define CHECK_EVEN(num) ((num) % MODULUS_NUM_2 == 0)
|
||||
#define RELEASE_DVPP_DATA(dvppDataPtr) do { \
|
||||
int retMacro; \
|
||||
if (dvppDataPtr != nullptr) { \
|
||||
retMacro = acldvppFree(dvppDataPtr); \
|
||||
if (retMacro != OK) { \
|
||||
std::cout << "Failed to free memory on dvpp, ret = " << retMacro << "." << std::endl; \
|
||||
} \
|
||||
dvppDataPtr = nullptr; \
|
||||
} \
|
||||
} while (0);
|
||||
|
||||
class DvppCommon {
|
||||
public:
|
||||
explicit DvppCommon(aclrtStream dvppStream);
|
||||
~DvppCommon();
|
||||
int Init(void);
|
||||
int DeInit(void);
|
||||
|
||||
static int GetVpcDataSize(uint32_t widthVpc, uint32_t heightVpc, acldvppPixelFormat format,
|
||||
uint32_t *vpcSize);
|
||||
|
||||
static int GetVpcInputStrideSize(uint32_t width, uint32_t height, acldvppPixelFormat format,
|
||||
uint32_t *widthStride, uint32_t *heightStride);
|
||||
|
||||
static int GetVpcOutputStrideSize(uint32_t width, uint32_t height, acldvppPixelFormat format,
|
||||
uint32_t *widthStride, uint32_t *heightStride);
|
||||
|
||||
static void GetJpegDecodeStrideSize(uint32_t width, uint32_t height, uint32_t *widthStride, uint32_t *heightStride);
|
||||
static int GetJpegImageInfo(const void *data, uint32_t dataSize, uint32_t *width, uint32_t *height,
|
||||
int32_t *components);
|
||||
|
||||
static int GetJpegDecodeDataSize(const void *data, uint32_t dataSize, acldvppPixelFormat format,
|
||||
uint32_t *decSize);
|
||||
|
||||
int VpcResize(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output, bool withSynchronize,
|
||||
VpcProcessType processType = VPC_PT_DEFAULT);
|
||||
|
||||
int JpegDecode(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output, bool withSynchronize);
|
||||
|
||||
int CombineResizeProcess(std::shared_ptr<DvppDataInfo> input, const DvppDataInfo &output, bool withSynchronize,
|
||||
VpcProcessType processType = VPC_PT_DEFAULT);
|
||||
|
||||
int CombineJpegdProcess(const RawData& imageInfo, acldvppPixelFormat format, bool withSynchronize);
|
||||
|
||||
std::shared_ptr<DvppDataInfo> GetInputImage();
|
||||
std::shared_ptr<DvppDataInfo> GetDecodedImage();
|
||||
std::shared_ptr<DvppDataInfo> GetResizedImage();
|
||||
|
||||
void ReleaseDvppBuffer();
|
||||
|
||||
private:
|
||||
int SetDvppPicDescData(std::shared_ptr<DvppDataInfo> dataInfo, std::shared_ptr<acldvppPicDesc>picDesc);
|
||||
int ResizeProcess(std::shared_ptr<acldvppPicDesc> inputDesc,
|
||||
std::shared_ptr<acldvppPicDesc> outputDesc, bool withSynchronize);
|
||||
|
||||
int ResizeWithPadding(std::shared_ptr<acldvppPicDesc> inputDesc, std::shared_ptr<acldvppPicDesc> outputDesc,
|
||||
const CropRoiConfig &cropRoi, const CropRoiConfig &pasteRoi, bool withSynchronize);
|
||||
|
||||
void GetCropRoi(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output,
|
||||
VpcProcessType processType, CropRoiConfig *cropRoi);
|
||||
|
||||
void GetPasteRoi(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output,
|
||||
VpcProcessType processType, CropRoiConfig *pasteRoi);
|
||||
|
||||
int CheckResizeParams(const DvppDataInfo &input, const DvppDataInfo &output);
|
||||
int TransferImageH2D(const RawData& imageInfo, const std::shared_ptr<DvppDataInfo>& jpegInput);
|
||||
int CreateStreamDesc(std::shared_ptr<DvppDataInfo> data);
|
||||
int DestroyResource();
|
||||
|
||||
std::shared_ptr<acldvppRoiConfig> cropAreaConfig_ = nullptr;
|
||||
std::shared_ptr<acldvppRoiConfig> pasteAreaConfig_ = nullptr;
|
||||
|
||||
std::shared_ptr<acldvppPicDesc> resizeInputDesc_ = nullptr;
|
||||
std::shared_ptr<acldvppPicDesc> resizeOutputDesc_ = nullptr;
|
||||
std::shared_ptr<acldvppPicDesc> decodeOutputDesc_ = nullptr;
|
||||
std::shared_ptr<acldvppResizeConfig> resizeConfig_ = nullptr;
|
||||
|
||||
acldvppChannelDesc *dvppChannelDesc_ = nullptr;
|
||||
aclrtStream dvppStream_ = nullptr;
|
||||
std::shared_ptr<DvppDataInfo> inputImage_ = nullptr;
|
||||
std::shared_ptr<DvppDataInfo> decodedImage_ = nullptr;
|
||||
std::shared_ptr<DvppDataInfo> resizedImage_ = nullptr;
|
||||
};
|
||||
#endif
|
|
@ -1,63 +0,0 @@
|
|||
/*
|
||||
* Copyright(C) 2020. Huawei Technologies Co.,Ltd. All rights reserved.
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef MODELPROCSS_H
|
||||
#define MODELPROCSS_H
|
||||
|
||||
#include <cstdio>
|
||||
#include <vector>
|
||||
#include <unordered_map>
|
||||
#include <mutex>
|
||||
#include <map>
|
||||
#include <memory>
|
||||
#include <string>
|
||||
#include "acl/acl.h"
|
||||
#include "CommonDataType.h"
|
||||
|
||||
class ModelProcess {
|
||||
public:
|
||||
explicit ModelProcess(const int deviceId);
|
||||
ModelProcess();
|
||||
~ModelProcess();
|
||||
|
||||
int Init(const std::string &modelPath);
|
||||
int DeInit();
|
||||
|
||||
int ModelInference(const std::vector<void *> &inputBufs,
|
||||
const std::vector<size_t> &inputSizes,
|
||||
const std::vector<void *> &ouputBufs,
|
||||
const std::vector<size_t> &outputSizes,
|
||||
std::map<double, double> *costTime_map);
|
||||
aclmdlDesc *GetModelDesc();
|
||||
int ReadBinaryFile(const std::string &fileName, uint8_t **buffShared, int *buffLength);
|
||||
|
||||
private:
|
||||
aclmdlDataset *CreateAndFillDataset(const std::vector<void *> &bufs, const std::vector<size_t> &sizes);
|
||||
void DestroyDataset(aclmdlDataset *dataset);
|
||||
|
||||
std::mutex mtx_ = {};
|
||||
int deviceId_ = 0;
|
||||
uint32_t modelId_ = 0;
|
||||
void *modelDevPtr_ = nullptr;
|
||||
size_t modelDevPtrSize_ = 0;
|
||||
void *weightDevPtr_ = nullptr;
|
||||
size_t weightDevPtrSize_ = 0;
|
||||
aclrtContext contextModel_ = nullptr;
|
||||
std::shared_ptr<aclmdlDesc> modelDesc_ = nullptr;
|
||||
bool isDeInit_ = false;
|
||||
};
|
||||
|
||||
#endif
|
|
@ -0,0 +1,32 @@
|
|||
/**
|
||||
* Copyright 2021 Huawei Technologies Co., Ltd
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef MINDSPORE_INFERENCE_UTILS_H_
|
||||
#define MINDSPORE_INFERENCE_UTILS_H_
|
||||
|
||||
#include <sys/stat.h>
|
||||
#include <dirent.h>
|
||||
#include <vector>
|
||||
#include <string>
|
||||
#include <memory>
|
||||
#include "include/api/types.h"
|
||||
|
||||
std::vector<std::string> GetAllFiles(std::string_view dirName);
|
||||
DIR *OpenDir(std::string_view dirName);
|
||||
std::string RealPath(std::string_view path);
|
||||
mindspore::MSTensor ReadFileToTensor(const std::string &file);
|
||||
int WriteResult(const std::string& imageFile, const std::vector<mindspore::MSTensor> &outputs);
|
||||
#endif
|
|
@ -1,367 +0,0 @@
|
|||
/*
|
||||
* Copyright (c) 2020.Huawei Technologies Co., Ltd. All rights reserved.
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include "AclProcess.h"
|
||||
#include <sys/time.h>
|
||||
#include <thread>
|
||||
#include <string>
|
||||
|
||||
/*
|
||||
* @description Implementation of constructor for class AclProcess with parameter list
|
||||
* @attention context is passed in as a parameter after being created in ResourceManager::InitResource
|
||||
*/
|
||||
AclProcess::AclProcess(int deviceId, const std::string &om_path, uint32_t width, uint32_t height)
|
||||
: deviceId_(deviceId), stream_(nullptr), modelProcess_(nullptr), dvppCommon_(nullptr), keepRatio_(true) {
|
||||
modelInfo_.modelPath = om_path;
|
||||
modelInfo_.modelWidth = width;
|
||||
modelInfo_.modelHeight = height;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description Release all the resource
|
||||
* @attention context will be released in ResourceManager::Release
|
||||
*/
|
||||
void AclProcess::Release() {
|
||||
// Synchronize stream and release Dvpp channel
|
||||
dvppCommon_->DeInit();
|
||||
// Release stream
|
||||
if (stream_ != nullptr) {
|
||||
int ret = aclrtDestroyStream(stream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to destroy the stream, ret = " << ret << ".";
|
||||
}
|
||||
stream_ = nullptr;
|
||||
}
|
||||
// Destroy resources of modelProcess_
|
||||
modelProcess_->DeInit();
|
||||
|
||||
// Release Dvpp buffer
|
||||
dvppCommon_->ReleaseDvppBuffer();
|
||||
|
||||
return;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description Initialize the modules used by this sample
|
||||
* @return int int code
|
||||
*/
|
||||
int AclProcess::InitModule() {
|
||||
// Create Dvpp common object
|
||||
if (dvppCommon_ == nullptr) {
|
||||
dvppCommon_ = std::make_shared<DvppCommon>(stream_);
|
||||
int retDvppCommon = dvppCommon_->Init();
|
||||
if (retDvppCommon != OK) {
|
||||
std::cout << "Failed to initialize dvppCommon, ret = " << retDvppCommon << std::endl;
|
||||
return retDvppCommon;
|
||||
}
|
||||
}
|
||||
// Create model inference object
|
||||
if (modelProcess_ == nullptr) {
|
||||
modelProcess_ = std::make_shared<ModelProcess>(deviceId_);
|
||||
}
|
||||
// Initialize ModelProcess module
|
||||
int ret = modelProcess_->Init(modelInfo_.modelPath);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to initialize the model process module, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
std::cout << "Initialized the model process module successfully." << std::endl;
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description Create resource for this sample
|
||||
* @return int int code
|
||||
*/
|
||||
int AclProcess::InitResource() {
|
||||
int ret = aclInit(nullptr); // Initialize ACL
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to init acl, ret = " << ret << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = aclrtSetDevice(deviceId_);
|
||||
if (ret != ACL_SUCCESS) {
|
||||
std::cout << "acl set device " << deviceId_ << "intCode = "<< static_cast<int32_t>(ret) << std::endl;
|
||||
return ret;
|
||||
}
|
||||
std::cout << "set device "<< deviceId_ << " success" << std::endl;
|
||||
|
||||
// create context (set current)
|
||||
ret = aclrtCreateContext(&context_, deviceId_);
|
||||
if (ret != ACL_SUCCESS) {
|
||||
std::cout << "acl create context failed, deviceId = " << deviceId_ <<
|
||||
"intCode = "<< static_cast<int32_t>(ret) << std::endl;
|
||||
return ret;
|
||||
}
|
||||
std::cout << "create context success" << std::endl;
|
||||
|
||||
ret = aclrtCreateStream(&stream_); // Create stream for application
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to create the acl stream, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
std::cout << "Created the acl stream successfully." << std::endl;
|
||||
// Initialize dvpp module
|
||||
if (InitModule() != OK) {
|
||||
return INIT_FAIL;
|
||||
}
|
||||
|
||||
aclmdlDesc *modelDesc = modelProcess_->GetModelDesc();
|
||||
size_t outputSize = aclmdlGetNumOutputs(modelDesc);
|
||||
modelInfo_.outputNum = outputSize;
|
||||
for (size_t i = 0; i < outputSize; i++) {
|
||||
size_t bufferSize = aclmdlGetOutputSizeByIndex(modelDesc, i);
|
||||
void *outputBuffer = nullptr;
|
||||
ret = aclrtMalloc(&outputBuffer, bufferSize, ACL_MEM_MALLOC_NORMAL_ONLY);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to malloc buffer, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
outputBuffers_.push_back(outputBuffer);
|
||||
outputSizes_.push_back(bufferSize);
|
||||
}
|
||||
|
||||
return OK;
|
||||
}
|
||||
|
||||
int AclProcess::WriteResult(const std::string& imageFile) {
|
||||
std::string homePath = "./result_Files";
|
||||
void *resHostBuf = nullptr;
|
||||
for (size_t i = 0; i < outputBuffers_.size(); ++i) {
|
||||
size_t output_size;
|
||||
void *netOutput;
|
||||
netOutput = outputBuffers_[i];
|
||||
output_size = outputSizes_[i];
|
||||
int ret = aclrtMallocHost(&resHostBuf, output_size);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to print the result, malloc host failed, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = aclrtMemcpy(resHostBuf, output_size, netOutput,
|
||||
output_size, ACL_MEMCPY_DEVICE_TO_HOST);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to print result, memcpy device to host failed, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
int pos = imageFile.rfind('/');
|
||||
std::string fileName(imageFile, pos + 1);
|
||||
fileName.replace(fileName.find('.'), fileName.size() - fileName.find('.'), "_" + std::to_string(i) + ".bin");
|
||||
|
||||
std::string outFileName = homePath + "/" + fileName;
|
||||
try {
|
||||
FILE *outputFile = fopen(outFileName.c_str(), "wb");
|
||||
if (outputFile == nullptr) {
|
||||
std::cout << "open result file " << outFileName << " failed" << std::endl;
|
||||
return INVALID_POINTER;
|
||||
}
|
||||
size_t size = fwrite(resHostBuf, sizeof(char), output_size, outputFile);
|
||||
if (size != output_size) {
|
||||
fclose(outputFile);
|
||||
outputFile = nullptr;
|
||||
std::cout << "write result file " << outFileName << " failed, write size[" << size <<
|
||||
"] is smaller than output size[" << output_size << "], maybe the disk is full." << std::endl;
|
||||
return ERROR;
|
||||
}
|
||||
|
||||
fclose(outputFile);
|
||||
outputFile = nullptr;
|
||||
} catch (std::exception &e) {
|
||||
std::cout << "write result file " << outFileName << " failed, error info: " << e.what() << std::endl;
|
||||
std::exit(1);
|
||||
}
|
||||
|
||||
ret = aclrtFreeHost(resHostBuf);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtFree host output memory failed" << std::endl;
|
||||
return ret;
|
||||
}
|
||||
}
|
||||
return OK;
|
||||
}
|
||||
|
||||
/**
|
||||
* Read a file, store it into the RawData structure
|
||||
*
|
||||
* @param filePath file to read to
|
||||
* @param fileData RawData structure to store in
|
||||
* @return OK if create success, int code otherwise
|
||||
*/
|
||||
int AclProcess::ReadFile(const std::string &filePath, RawData *fileData) {
|
||||
// Open file with reading mode
|
||||
FILE *fp = fopen(filePath.c_str(), "rb");
|
||||
if (fp == nullptr) {
|
||||
std::cout << "Failed to open file, filePath = " << filePath << std::endl;
|
||||
return OPEN_FILE_FAIL;
|
||||
}
|
||||
// Get the length of input file
|
||||
fseek(fp, 0, SEEK_END);
|
||||
size_t fileSize = ftell(fp);
|
||||
fseek(fp, 0, SEEK_SET);
|
||||
// If file not empty, read it into FileInfo and return it
|
||||
if (fileSize > 0) {
|
||||
fileData->lenOfByte = fileSize;
|
||||
fileData->data = std::make_shared<uint8_t>();
|
||||
fileData->data.reset(new uint8_t[fileSize], std::default_delete<uint8_t[]>());
|
||||
uint32_t readRet = fread(fileData->data.get(), 1, fileSize, fp);
|
||||
if (readRet == 0) {
|
||||
fclose(fp);
|
||||
return READ_FILE_FAIL;
|
||||
}
|
||||
fclose(fp);
|
||||
return OK;
|
||||
}
|
||||
fclose(fp);
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
/*
|
||||
* @description Preprocess the input image
|
||||
* @param imageFile input image path
|
||||
* @return int int code
|
||||
*/
|
||||
int AclProcess::Preprocess(const std::string& imageFile) {
|
||||
RawData imageInfo;
|
||||
int ret = ReadFile(imageFile, &imageInfo); // Read image data from input image file
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to read file, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
// Run process of jpegD
|
||||
ret = dvppCommon_->CombineJpegdProcess(imageInfo, PIXEL_FORMAT_YUV_SEMIPLANAR_420, true);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to execute image decoded of preprocess module, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
// Get output of decode jpeg image
|
||||
std::shared_ptr<DvppDataInfo> decodeOutData = dvppCommon_->GetDecodedImage();
|
||||
// Run resize application function
|
||||
DvppDataInfo resizeOutData;
|
||||
resizeOutData.height = modelInfo_.modelHeight;
|
||||
resizeOutData.width = modelInfo_.modelWidth;
|
||||
resizeOutData.format = PIXEL_FORMAT_YUV_SEMIPLANAR_420;
|
||||
ret = dvppCommon_->CombineResizeProcess(decodeOutData, resizeOutData, true, VPC_PT_PADDING);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to execute image resized of preprocess module, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
RELEASE_DVPP_DATA(decodeOutData->data);
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description Inference of model
|
||||
* @return int int code
|
||||
*/
|
||||
int AclProcess::ModelInfer(std::map<double, double> *costTime_map) {
|
||||
// Get output of resize module
|
||||
std::shared_ptr<DvppDataInfo> resizeOutData = dvppCommon_->GetResizedImage();
|
||||
std::shared_ptr<DvppDataInfo> inputImg = dvppCommon_->GetInputImage();
|
||||
|
||||
float widthScale, heightScale;
|
||||
if (keepRatio_) {
|
||||
widthScale = static_cast<float>(resizeOutData->width) / inputImg->width;
|
||||
if (widthScale > static_cast<float>(resizeOutData->height) / inputImg->height) {
|
||||
widthScale = static_cast<float>(resizeOutData->height) / inputImg->height;
|
||||
}
|
||||
heightScale = widthScale;
|
||||
} else {
|
||||
widthScale = static_cast<float>(resizeOutData->width) / inputImg->width;
|
||||
heightScale = static_cast<float>(resizeOutData->height) / inputImg->height;
|
||||
}
|
||||
|
||||
float im_info[4];
|
||||
im_info[0] = static_cast<float>(inputImg->height);
|
||||
im_info[1] = static_cast<float>(inputImg->width);
|
||||
im_info[2] = heightScale;
|
||||
im_info[3] = widthScale;
|
||||
void *imInfo_dst = nullptr;
|
||||
int ret = aclrtMalloc(&imInfo_dst, 16, ACL_MEM_MALLOC_NORMAL_ONLY);
|
||||
if (ret != ACL_ERROR_NONE) {
|
||||
std::cout << "aclrtMalloc failed, ret = " << ret << std::endl;
|
||||
aclrtFree(imInfo_dst);
|
||||
return ret;
|
||||
}
|
||||
ret = aclrtMemcpy(reinterpret_cast<uint8_t *>(imInfo_dst), 16, im_info, 16, ACL_MEMCPY_HOST_TO_DEVICE);
|
||||
if (ret != ACL_ERROR_NONE) {
|
||||
std::cout << "aclrtMemcpy failed, ret = " << ret << std::endl;
|
||||
aclrtFree(imInfo_dst);
|
||||
return ret;
|
||||
}
|
||||
|
||||
std::vector<void *> inputBuffers({resizeOutData->data, imInfo_dst});
|
||||
std::vector<size_t> inputSizes({resizeOutData->dataSize, 4 * 4});
|
||||
|
||||
for (size_t i = 0; i < modelInfo_.outputNum; i++) {
|
||||
aclrtMemset(outputBuffers_[i], outputSizes_[i], 0, outputSizes_[i]);
|
||||
}
|
||||
// Execute classification model
|
||||
ret = modelProcess_->ModelInference(inputBuffers, inputSizes, outputBuffers_, outputSizes_, costTime_map);
|
||||
if (ret != OK) {
|
||||
aclrtFree(imInfo_dst);
|
||||
std::cout << "Failed to execute the classification model, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = aclrtFree(imInfo_dst);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtFree image info failed" << std::endl;
|
||||
return ret;
|
||||
}
|
||||
RELEASE_DVPP_DATA(resizeOutData->data);
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description Process classification
|
||||
*
|
||||
* @par Function
|
||||
* 1.Dvpp module preprocess
|
||||
* 2.Execute classification model
|
||||
* 3.Execute single operator
|
||||
* 4.Write result
|
||||
*
|
||||
* @param imageFile input file path
|
||||
* @return int int code
|
||||
*/
|
||||
|
||||
int AclProcess::Process(const std::string& imageFile, std::map<double, double> *costTime_map) {
|
||||
struct timeval begin = {0};
|
||||
struct timeval end = {0};
|
||||
gettimeofday(&begin, nullptr);
|
||||
|
||||
int ret = Preprocess(imageFile);
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = ModelInfer(costTime_map);
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = WriteResult(imageFile);
|
||||
if (ret != OK) {
|
||||
std::cout << "write result failed." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
gettimeofday(&end, nullptr);
|
||||
|
||||
const double costMs = SEC2MS * (end.tv_sec - begin.tv_sec) + (end.tv_usec - begin.tv_usec) / SEC2MS;
|
||||
std::cout << "[Process Delay] cost: " << costMs << "ms." << std::endl;
|
||||
return OK;
|
||||
}
|
|
@ -1,42 +0,0 @@
|
|||
# Copyright (c) Huawei Technologies Co., Ltd. 2020. All rights reserved.
|
||||
|
||||
# CMake lowest version requirement
|
||||
cmake_minimum_required(VERSION 3.5.1)
|
||||
# Add definitions ENABLE_DVPP_INTERFACE to use dvpp api
|
||||
add_definitions(-DENABLE_DVPP_INTERFACE)
|
||||
# project information
|
||||
project(InferClassification)
|
||||
# Check environment variable
|
||||
if(NOT DEFINED ENV{ASCEND_HOME})
|
||||
message(FATAL_ERROR "please define environment variable:ASCEND_HOME")
|
||||
endif()
|
||||
|
||||
# Compile options
|
||||
add_compile_options(-std=c++11 -fPIE -g -fstack-protector-all -Werror -Wreturn-type)
|
||||
|
||||
# Skip build rpath
|
||||
set(CMAKE_SKIP_BUILD_RPATH True)
|
||||
|
||||
# Set output directory
|
||||
set(PROJECT_SRC_ROOT ${CMAKE_CURRENT_LIST_DIR}/)
|
||||
set(CMAKE_RUNTIME_OUTPUT_DIRECTORY ${PROJECT_SRC_ROOT}/out)
|
||||
|
||||
# Set include directory and library directory
|
||||
set(ACL_LIB_DIR $ENV{ASCEND_HOME}/acllib)
|
||||
set(ATLAS_ACL_LIB_DIR $ENV{ASCEND_HOME}/ascend-toolkit/latest/acllib)
|
||||
# Header path
|
||||
include_directories(${ACL_LIB_DIR}/include/)
|
||||
include_directories(${ATLAS_ACL_LIB_DIR}/include/)
|
||||
include_directories(${PROJECT_SRC_ROOT}/../inc)
|
||||
|
||||
# add host lib path
|
||||
link_directories(${ACL_LIB_DIR})
|
||||
find_library(acl libascendcl.so ${ACL_LIB_DIR}/lib64 ${ATLAS_ACL_LIB_DIR}/lib64)
|
||||
find_library(acl_dvpp libacl_dvpp.so ${ACL_LIB_DIR}/lib64 ${ATLAS_ACL_LIB_DIR}/lib64)
|
||||
|
||||
add_executable(main AclProcess.cpp
|
||||
DvppCommon.cpp
|
||||
ModelProcess.cpp
|
||||
main.cpp)
|
||||
|
||||
target_link_libraries(main ${acl} gflags ${acl_dvpp} pthread)
|
|
@ -1,735 +0,0 @@
|
|||
/*
|
||||
* Copyright (c) 2020.Huawei Technologies Co., Ltd. All rights reserved.
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include <iostream>
|
||||
#include <memory>
|
||||
|
||||
#include "../inc/DvppCommon.h"
|
||||
#include "../inc/CommonDataType.h"
|
||||
|
||||
static auto g_resizeConfigDeleter = [](acldvppResizeConfig *p) { acldvppDestroyResizeConfig(p); };
|
||||
static auto g_picDescDeleter = [](acldvppPicDesc *picDesc) { acldvppDestroyPicDesc(picDesc); };
|
||||
static auto g_roiConfigDeleter = [](acldvppRoiConfig *p) { acldvppDestroyRoiConfig(p); };
|
||||
|
||||
DvppCommon::DvppCommon(aclrtStream dvppStream):dvppStream_(dvppStream) {}
|
||||
|
||||
/*
|
||||
* @description: Create a channel for processing image data,
|
||||
* the channel description is created by acldvppCreateChannelDesc
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::Init(void) {
|
||||
dvppChannelDesc_ = acldvppCreateChannelDesc();
|
||||
if (dvppChannelDesc_ == nullptr) {
|
||||
return -1;
|
||||
}
|
||||
int ret = acldvppCreateChannel(dvppChannelDesc_);
|
||||
if (ret != 0) {
|
||||
std::cout << "Failed to create dvpp channel, ret = " << ret << "." << std::endl;
|
||||
acldvppDestroyChannelDesc(dvppChannelDesc_);
|
||||
dvppChannelDesc_ = nullptr;
|
||||
return ret;
|
||||
}
|
||||
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: destroy the channel and the channel description used by image.
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::DeInit(void) {
|
||||
int ret = aclrtSynchronizeStream(dvppStream_); // int ret
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to synchronize stream, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = acldvppDestroyChannel(dvppChannelDesc_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to destroy dvpp channel, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = acldvppDestroyChannelDesc(dvppChannelDesc_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to destroy dvpp channel description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Release the memory that is allocated in the interfaces which are started with "Combine"
|
||||
*/
|
||||
void DvppCommon::ReleaseDvppBuffer() {
|
||||
if (resizedImage_ != nullptr) {
|
||||
RELEASE_DVPP_DATA(resizedImage_->data);
|
||||
}
|
||||
if (decodedImage_ != nullptr) {
|
||||
RELEASE_DVPP_DATA(decodedImage_->data);
|
||||
}
|
||||
if (inputImage_ != nullptr) {
|
||||
RELEASE_DVPP_DATA(inputImage_->data);
|
||||
}
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get the size of buffer used to save image for VPC according to width, height and format
|
||||
* @param width specifies the width of the output image
|
||||
* @param height specifies the height of the output image
|
||||
* @param format specifies the format of the output image
|
||||
* @param: vpcSize is used to save the result size
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::GetVpcDataSize(uint32_t width, uint32_t height, acldvppPixelFormat format, uint32_t *vpcSize) {
|
||||
if (format != PIXEL_FORMAT_YUV_SEMIPLANAR_420 && format != PIXEL_FORMAT_YVU_SEMIPLANAR_420) {
|
||||
std::cout << "Format[" << format << "] for VPC is not supported, just support NV12 or NV21." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
uint32_t widthStride = DVPP_ALIGN_UP(width, VPC_WIDTH_ALIGN);
|
||||
uint32_t heightStride = DVPP_ALIGN_UP(height, VPC_HEIGHT_ALIGN);
|
||||
*vpcSize = widthStride * heightStride * YUV_BGR_SIZE_CONVERT_3 / YUV_BGR_SIZE_CONVERT_2;
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get the aligned width and height of the input image according to the image format
|
||||
* @param: width specifies the width before alignment
|
||||
* @param: height specifies the height before alignment
|
||||
* @param: format specifies the image format
|
||||
* @param: widthStride is used to save the width after alignment
|
||||
* @param: heightStride is used to save the height after alignment
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::GetVpcInputStrideSize(uint32_t width, uint32_t height, acldvppPixelFormat format,
|
||||
uint32_t *widthStride, uint32_t *heightStride) {
|
||||
uint32_t inputWidthStride;
|
||||
if (format >= PIXEL_FORMAT_YUV_400 && format <= PIXEL_FORMAT_YVU_SEMIPLANAR_444) {
|
||||
inputWidthStride = DVPP_ALIGN_UP(width, VPC_STRIDE_WIDTH);
|
||||
} else if (format >= PIXEL_FORMAT_YUYV_PACKED_422 && format <= PIXEL_FORMAT_VYUY_PACKED_422) {
|
||||
inputWidthStride = DVPP_ALIGN_UP(width, VPC_STRIDE_WIDTH) * YUV422_WIDTH_NU;
|
||||
} else if (format >= PIXEL_FORMAT_YUV_PACKED_444 && format <= PIXEL_FORMAT_BGR_888) {
|
||||
inputWidthStride = DVPP_ALIGN_UP(width, VPC_STRIDE_WIDTH) * YUV444_RGB_WIDTH_NU;
|
||||
} else if (format >= PIXEL_FORMAT_ARGB_8888 && format <= PIXEL_FORMAT_BGRA_8888) {
|
||||
inputWidthStride = DVPP_ALIGN_UP(width, VPC_STRIDE_WIDTH) * XRGB_WIDTH_NU;
|
||||
} else {
|
||||
std::cout << "Input format[" << format << "] for VPC is invalid, please check it." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
uint32_t inputHeightStride = DVPP_ALIGN_UP(height, VPC_STRIDE_HEIGHT);
|
||||
if (inputWidthStride > MAX_RESIZE_WIDTH || inputWidthStride < MIN_RESIZE_WIDTH) {
|
||||
std::cout << "Input width stride " << inputWidthStride << " is invalid, not in [" << MIN_RESIZE_WIDTH \
|
||||
<< ", " << MAX_RESIZE_WIDTH << "]." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
|
||||
if (inputHeightStride > MAX_RESIZE_HEIGHT || inputHeightStride < MIN_RESIZE_HEIGHT) {
|
||||
std::cout << "Input height stride " << inputHeightStride << " is invalid, not in [" << MIN_RESIZE_HEIGHT \
|
||||
<< ", " << MAX_RESIZE_HEIGHT << "]." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
*widthStride = inputWidthStride;
|
||||
*heightStride = inputHeightStride;
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get the aligned width and height of the output image according to the image format
|
||||
* @param: width specifies the width before alignment
|
||||
* @param: height specifies the height before alignment
|
||||
* @param: format specifies the image format
|
||||
* @param: widthStride is used to save the width after alignment
|
||||
* @param: heightStride is used to save the height after alignment
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::GetVpcOutputStrideSize(uint32_t width, uint32_t height, acldvppPixelFormat format,
|
||||
uint32_t *widthStride, uint32_t *heightStride) {
|
||||
if (format != PIXEL_FORMAT_YUV_SEMIPLANAR_420 && format != PIXEL_FORMAT_YVU_SEMIPLANAR_420) {
|
||||
std::cout << "Output format[" << format << "] is not supported, just support NV12 or NV21." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
|
||||
*widthStride = DVPP_ALIGN_UP(width, VPC_STRIDE_WIDTH);
|
||||
*heightStride = DVPP_ALIGN_UP(height, VPC_STRIDE_HEIGHT);
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Set picture description information and execute resize function
|
||||
* @param: input specifies the input image information
|
||||
* @param: output specifies the output image information
|
||||
* @param: withSynchronize specifies whether to execute synchronously
|
||||
* @param: processType specifies whether to perform proportional scaling, default is non-proportional resize
|
||||
* @return: OK if success, other values if failure
|
||||
* @attention: This function can be called only when the DvppCommon object is initialized with Init
|
||||
*/
|
||||
int DvppCommon::VpcResize(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output,
|
||||
bool withSynchronize, VpcProcessType processType) {
|
||||
acldvppPicDesc *inputDesc = acldvppCreatePicDesc();
|
||||
acldvppPicDesc *outputDesc = acldvppCreatePicDesc();
|
||||
resizeInputDesc_.reset(inputDesc, g_picDescDeleter);
|
||||
resizeOutputDesc_.reset(outputDesc, g_picDescDeleter);
|
||||
|
||||
// Set dvpp picture descriptin info of input image
|
||||
int ret = SetDvppPicDescData(input, resizeInputDesc_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set dvpp input picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
// Set dvpp picture descriptin info of output image
|
||||
ret = SetDvppPicDescData(output, resizeOutputDesc_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set dvpp output picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
if (processType == VPC_PT_DEFAULT) {
|
||||
return ResizeProcess(resizeInputDesc_, resizeOutputDesc_, withSynchronize);
|
||||
}
|
||||
|
||||
// Get crop area according to the processType
|
||||
CropRoiConfig cropRoi = {0};
|
||||
GetCropRoi(input, output, processType, &cropRoi);
|
||||
|
||||
// The width and height of the original image will be resized by the same ratio
|
||||
CropRoiConfig pasteRoi = {0};
|
||||
GetPasteRoi(input, output, processType, &pasteRoi);
|
||||
|
||||
return ResizeWithPadding(resizeInputDesc_, resizeOutputDesc_, cropRoi, pasteRoi, withSynchronize);
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Set image description information
|
||||
* @param: dataInfo specifies the image information
|
||||
* @param: picsDesc specifies the picture description information to be set
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::SetDvppPicDescData(std::shared_ptr<DvppDataInfo> dataInfo, std::shared_ptr<acldvppPicDesc>picDesc) {
|
||||
int ret = acldvppSetPicDescData(picDesc.get(), dataInfo->data);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set data for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = acldvppSetPicDescSize(picDesc.get(), dataInfo->dataSize);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set size for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = acldvppSetPicDescFormat(picDesc.get(), dataInfo->format);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set format for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = acldvppSetPicDescWidth(picDesc.get(), dataInfo->width);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set width for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = acldvppSetPicDescHeight(picDesc.get(), dataInfo->height);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set height for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = acldvppSetPicDescWidthStride(picDesc.get(), dataInfo->widthStride);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set aligned width for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = acldvppSetPicDescHeightStride(picDesc.get(), dataInfo->heightStride);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set aligned height for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Check whether the image format and zoom ratio meet the requirements
|
||||
* @param: input specifies the input image information
|
||||
* @param: output specifies the output image information
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::CheckResizeParams(const DvppDataInfo &input, const DvppDataInfo &output) {
|
||||
if (output.format != PIXEL_FORMAT_YUV_SEMIPLANAR_420 && output.format != PIXEL_FORMAT_YVU_SEMIPLANAR_420) {
|
||||
std::cout << "Output format[" << output.format << "]is not supported, just support NV12 or NV21." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
float heightScale = static_cast<float>(output.height) / input.height;
|
||||
if (heightScale < MIN_RESIZE_SCALE || heightScale > MAX_RESIZE_SCALE) {
|
||||
std::cout << "Resize scale should be in range [1/16, 32], which is " << heightScale << "." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
float widthScale = static_cast<float>(output.width) / input.width;
|
||||
if (widthScale < MIN_RESIZE_SCALE || widthScale > MAX_RESIZE_SCALE) {
|
||||
std::cout << "Resize scale should be in range [1/16, 32], which is " << widthScale << "." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Scale the input image to the size specified by the output image and
|
||||
* saves the result to the output image (non-proportionate scaling)
|
||||
* @param: inputDesc specifies the description information of the input image
|
||||
* @param: outputDesc specifies the description information of the output image
|
||||
* @param: withSynchronize specifies whether to execute synchronously
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::ResizeProcess(std::shared_ptr<acldvppPicDesc>inputDesc,
|
||||
std::shared_ptr<acldvppPicDesc>outputDesc,
|
||||
bool withSynchronize) {
|
||||
acldvppResizeConfig *resizeConfig = acldvppCreateResizeConfig();
|
||||
if (resizeConfig == nullptr) {
|
||||
std::cout << "Failed to create dvpp resize config." << std::endl;
|
||||
return INVALID_POINTER;
|
||||
}
|
||||
|
||||
resizeConfig_.reset(resizeConfig, g_resizeConfigDeleter);
|
||||
int ret = acldvppVpcResizeAsync(dvppChannelDesc_, inputDesc.get(), outputDesc.get(),
|
||||
resizeConfig_.get(), dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to resize asynchronously, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
if (withSynchronize) {
|
||||
ret = aclrtSynchronizeStream(dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to synchronize stream, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
}
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Crop the image from the input image based on the specified area and
|
||||
* paste the cropped image to the specified position of the target image
|
||||
* as the output image
|
||||
* @param: inputDesc specifies the description information of the input image
|
||||
* @param: outputDesc specifies the description information of the output image
|
||||
* @param: cropRoi specifies the cropped area
|
||||
* @param: pasteRoi specifies the pasting area
|
||||
* @param: withSynchronize specifies whether to execute synchronously
|
||||
* @return: OK if success, other values if failure
|
||||
* @attention: If the width and height of the crop area are different from those of the
|
||||
* paste area, the image is scaled again
|
||||
*/
|
||||
int DvppCommon::ResizeWithPadding(std::shared_ptr<acldvppPicDesc> inputDesc,
|
||||
std::shared_ptr<acldvppPicDesc> outputDesc,
|
||||
const CropRoiConfig &cropRoi, const CropRoiConfig &pasteRoi, bool withSynchronize) {
|
||||
acldvppRoiConfig *cropRoiCfg = acldvppCreateRoiConfig(cropRoi.left, cropRoi.right, cropRoi.up, cropRoi.down);
|
||||
if (cropRoiCfg == nullptr) {
|
||||
std::cout << "Failed to create dvpp roi config for corp area." << std::endl;
|
||||
return INVALID_POINTER;
|
||||
}
|
||||
cropAreaConfig_.reset(cropRoiCfg, g_roiConfigDeleter);
|
||||
|
||||
acldvppRoiConfig *pastRoiCfg = acldvppCreateRoiConfig(pasteRoi.left, pasteRoi.right, pasteRoi.up, pasteRoi.down);
|
||||
if (pastRoiCfg == nullptr) {
|
||||
std::cout << "Failed to create dvpp roi config for paster area." << std::endl;
|
||||
return INVALID_POINTER;
|
||||
}
|
||||
pasteAreaConfig_.reset(pastRoiCfg, g_roiConfigDeleter);
|
||||
|
||||
int ret = acldvppVpcCropAndPasteAsync(dvppChannelDesc_, inputDesc.get(), outputDesc.get(), cropAreaConfig_.get(),
|
||||
pasteAreaConfig_.get(), dvppStream_);
|
||||
if (ret != OK) {
|
||||
// release resource.
|
||||
std::cout << "Failed to crop and paste asynchronously, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
if (withSynchronize) {
|
||||
ret = aclrtSynchronizeStream(dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed tp synchronize stream, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
}
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get crop area
|
||||
* @param: input specifies the input image information
|
||||
* @param: output specifies the output image information
|
||||
* @param: processType specifies whether to perform proportional scaling
|
||||
* @param: cropRoi is used to save the info of the crop roi area
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
void DvppCommon::GetCropRoi(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output,
|
||||
VpcProcessType processType, CropRoiConfig *cropRoi) {
|
||||
// When processType is not VPC_PT_FILL, crop area is the whole input image
|
||||
if (processType != VPC_PT_FILL) {
|
||||
cropRoi->right = CONVERT_TO_ODD(input->width - ODD_NUM_1);
|
||||
cropRoi->down = CONVERT_TO_ODD(input->height - ODD_NUM_1);
|
||||
return;
|
||||
}
|
||||
|
||||
bool widthRatioSmaller = true;
|
||||
// The scaling ratio is based on the smaller ratio to ensure the smallest edge to fill the targe edge
|
||||
float resizeRatio = static_cast<float>(input->width) / output->width;
|
||||
if (resizeRatio > (static_cast<float>(input->height) / output->height)) {
|
||||
resizeRatio = static_cast<float>(input->height) / output->height;
|
||||
widthRatioSmaller = false;
|
||||
}
|
||||
|
||||
const int halfValue = 2;
|
||||
// The left and up must be even, right and down must be odd which is required by acl
|
||||
if (widthRatioSmaller) {
|
||||
cropRoi->left = 0;
|
||||
cropRoi->right = CONVERT_TO_ODD(input->width - ODD_NUM_1);
|
||||
cropRoi->up = CONVERT_TO_EVEN(static_cast<uint32_t>((input->height - output->height * resizeRatio) /
|
||||
halfValue));
|
||||
cropRoi->down = CONVERT_TO_ODD(input->height - cropRoi->up - ODD_NUM_1);
|
||||
return;
|
||||
}
|
||||
|
||||
cropRoi->up = 0;
|
||||
cropRoi->down = CONVERT_TO_ODD(input->height - ODD_NUM_1);
|
||||
cropRoi->left = CONVERT_TO_EVEN(static_cast<uint32_t>((input->width - output->width * resizeRatio) / halfValue));
|
||||
cropRoi->right = CONVERT_TO_ODD(input->width - cropRoi->left - ODD_NUM_1);
|
||||
return;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get paste area
|
||||
* @param: input specifies the input image information
|
||||
* @param: output specifies the output image information
|
||||
* @param: processType specifies whether to perform proportional scaling
|
||||
* @param: pasteRio is used to save the info of the paste area
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
void DvppCommon::GetPasteRoi(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output,
|
||||
VpcProcessType processType, CropRoiConfig *pasteRoi) {
|
||||
if (processType == VPC_PT_FILL) {
|
||||
pasteRoi->right = CONVERT_TO_ODD(output->width - ODD_NUM_1);
|
||||
pasteRoi->down = CONVERT_TO_ODD(output->height - ODD_NUM_1);
|
||||
return;
|
||||
}
|
||||
|
||||
bool widthRatioLarger = true;
|
||||
// The scaling ratio is based on the larger ratio to ensure the largest edge to fill the targe edge
|
||||
float resizeRatio = static_cast<float>(input->width) / output->width;
|
||||
if (resizeRatio < (static_cast<float>(input->height) / output->height)) {
|
||||
resizeRatio = static_cast<float>(input->height) / output->height;
|
||||
widthRatioLarger = false;
|
||||
}
|
||||
|
||||
// Left and up is 0 when the roi paste on the upper left corner
|
||||
if (processType == VPC_PT_PADDING) {
|
||||
pasteRoi->right = (input->width / resizeRatio) - ODD_NUM_1;
|
||||
pasteRoi->down = (input->height / resizeRatio) - ODD_NUM_1;
|
||||
pasteRoi->right = CONVERT_TO_ODD(pasteRoi->right);
|
||||
pasteRoi->down = CONVERT_TO_ODD(pasteRoi->down);
|
||||
return;
|
||||
}
|
||||
|
||||
const int halfValue = 2;
|
||||
// Left and up is 0 when the roi paste on the middler location
|
||||
if (widthRatioLarger) {
|
||||
pasteRoi->left = 0;
|
||||
pasteRoi->right = output->width - ODD_NUM_1;
|
||||
pasteRoi->up = (output->height - (input->height / resizeRatio)) / halfValue;
|
||||
pasteRoi->down = output->height - pasteRoi->up - ODD_NUM_1;
|
||||
} else {
|
||||
pasteRoi->up = 0;
|
||||
pasteRoi->down = output->height - ODD_NUM_1;
|
||||
pasteRoi->left = (output->width - (input->width / resizeRatio)) / halfValue;
|
||||
pasteRoi->right = output->width - pasteRoi->left - ODD_NUM_1;
|
||||
}
|
||||
|
||||
// The left must be even and align to 16, up must be even, right and down must be odd which is required by acl
|
||||
pasteRoi->left = DVPP_ALIGN_UP(CONVERT_TO_EVEN(pasteRoi->left), VPC_WIDTH_ALIGN);
|
||||
pasteRoi->right = CONVERT_TO_ODD(pasteRoi->right);
|
||||
pasteRoi->up = CONVERT_TO_EVEN(pasteRoi->up);
|
||||
pasteRoi->down = CONVERT_TO_ODD(pasteRoi->down);
|
||||
return;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Resize the image specified by input and save the result to member variable resizedImage_
|
||||
* @param: input specifies the input image information
|
||||
* @param: output specifies the output image information
|
||||
* @param: withSynchronize specifies whether to execute synchronously
|
||||
* @param: processType specifies whether to perform proportional scaling, default is non-proportional resize
|
||||
* @return: OK if success, other values if failure
|
||||
* @attention: This function can be called only when the DvppCommon object is initialized with Init
|
||||
*/
|
||||
int DvppCommon::CombineResizeProcess(std::shared_ptr<DvppDataInfo> input, const DvppDataInfo &output,
|
||||
bool withSynchronize, VpcProcessType processType) {
|
||||
int ret = CheckResizeParams(*input, output);
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
// Get widthStride and heightStride for input and output image according to the format
|
||||
ret = GetVpcInputStrideSize(input->widthStride, input->heightStride, input->format,
|
||||
&(input->widthStride), &(input->heightStride));
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
|
||||
resizedImage_ = std::make_shared<DvppDataInfo>();
|
||||
resizedImage_->width = output.width;
|
||||
resizedImage_->height = output.height;
|
||||
resizedImage_->format = output.format;
|
||||
ret = GetVpcOutputStrideSize(output.width, output.height, output.format, &(resizedImage_->widthStride),
|
||||
&(resizedImage_->heightStride));
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
// Get output buffer size for resize output
|
||||
ret = GetVpcDataSize(output.width, output.height, output.format, &(resizedImage_->dataSize));
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
// Malloc buffer for output of resize module
|
||||
// Need to pay attention to release of the buffer
|
||||
ret = acldvppMalloc(reinterpret_cast<void **>(&(resizedImage_->data)), resizedImage_->dataSize);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to malloc " << resizedImage_->dataSize << " bytes on dvpp for resize" << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
aclrtMemset(resizedImage_->data, resizedImage_->dataSize, YUV_GREYER_VALUE, resizedImage_->dataSize);
|
||||
resizedImage_->frameId = input->frameId;
|
||||
ret = VpcResize(input, resizedImage_, withSynchronize, processType);
|
||||
if (ret != OK) {
|
||||
// Release the output buffer when resize failed, otherwise release it after use
|
||||
RELEASE_DVPP_DATA(resizedImage_->data);
|
||||
}
|
||||
return ret;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Set the description of the output image and decode
|
||||
* @param: input specifies the input image information
|
||||
* @param: output specifies the output image information
|
||||
* @param: withSynchronize specifies whether to execute synchronously
|
||||
* @return: OK if success, other values if failure
|
||||
* @attention: This function can be called only when the DvppCommon object is initialized with Init
|
||||
*/
|
||||
int DvppCommon::JpegDecode(std::shared_ptr<DvppDataInfo> input,
|
||||
std::shared_ptr<DvppDataInfo> output,
|
||||
bool withSynchronize) {
|
||||
acldvppPicDesc *outputDesc = acldvppCreatePicDesc();
|
||||
decodeOutputDesc_.reset(outputDesc, g_picDescDeleter);
|
||||
|
||||
int ret = SetDvppPicDescData(output, decodeOutputDesc_);
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = acldvppJpegDecodeAsync(dvppChannelDesc_, input->data, input->dataSize, decodeOutputDesc_.get(), dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to decode jpeg, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
if (withSynchronize) {
|
||||
ret = aclrtSynchronizeStream(dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to synchronize stream, ret = " << ret << "." << std::endl;
|
||||
return DECODE_FAIL;
|
||||
}
|
||||
}
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get the aligned width and height of the image after decoding
|
||||
* @param: width specifies the width before alignment
|
||||
* @param: height specifies the height before alignment
|
||||
* @param: widthStride is used to save the width after alignment
|
||||
* @param: heightStride is used to save the height after alignment
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
void DvppCommon::GetJpegDecodeStrideSize(uint32_t width, uint32_t height,
|
||||
uint32_t *widthStride, uint32_t *heightStride) {
|
||||
*widthStride = DVPP_ALIGN_UP(width, JPEGD_STRIDE_WIDTH);
|
||||
*heightStride = DVPP_ALIGN_UP(height, JPEGD_STRIDE_HEIGHT);
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get picture width and height and number of channels from image data
|
||||
* @param: data specifies the memory to store the image data
|
||||
* @param: dataSize specifies the size of the image data
|
||||
* @param: width is used to save the image width
|
||||
* @param: height is used to save the image height
|
||||
* @param: components is used to save the number of channels
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::GetJpegImageInfo(const void *data, uint32_t dataSize, uint32_t *width, uint32_t *height,
|
||||
int32_t *components) {
|
||||
uint32_t widthTmp;
|
||||
uint32_t heightTmp;
|
||||
int32_t componentsTmp;
|
||||
int ret = acldvppJpegGetImageInfo(data, dataSize, &widthTmp, &heightTmp, &componentsTmp);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to get image info of jpeg, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
if (widthTmp > MAX_JPEGD_WIDTH || widthTmp < MIN_JPEGD_WIDTH) {
|
||||
std::cout << "Input width is invalid, not in [" << MIN_JPEGD_WIDTH << ", "
|
||||
<< MAX_JPEGD_WIDTH << "]." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
if (heightTmp > MAX_JPEGD_HEIGHT || heightTmp < MIN_JPEGD_HEIGHT) {
|
||||
std::cout << "Input height is invalid, not in [" << MIN_JPEGD_HEIGHT << ", "
|
||||
<< MAX_JPEGD_HEIGHT << "]." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
*width = widthTmp;
|
||||
*height = heightTmp;
|
||||
*components = componentsTmp;
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get the size of the buffer for storing decoded images based on the image data, size, and format
|
||||
* @param: data specifies the memory to store the image data
|
||||
* @param: dataSize specifies the size of the image data
|
||||
* @param: format specifies the image format
|
||||
* @param: decSize is used to store the result size
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::GetJpegDecodeDataSize(const void *data, uint32_t dataSize, acldvppPixelFormat format,
|
||||
uint32_t *decSize) {
|
||||
uint32_t outputSize;
|
||||
int ret = acldvppJpegPredictDecSize(data, dataSize, format, &outputSize);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to predict decode size of jpeg image, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
*decSize = outputSize;
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Decode the image specified by imageInfo and save the result to member variable decodedImage_
|
||||
* @param: imageInfo specifies image information
|
||||
* @param: format specifies the image format
|
||||
* @param: withSynchronize specifies whether to execute synchronously
|
||||
* @return: OK if success, other values if failure
|
||||
* @attention: This function can be called only when the DvppCommon object is initialized with Init
|
||||
*/
|
||||
int DvppCommon::CombineJpegdProcess(const RawData& imageInfo, acldvppPixelFormat format, bool withSynchronize) {
|
||||
int32_t components;
|
||||
inputImage_ = std::make_shared<DvppDataInfo>();
|
||||
inputImage_->format = format;
|
||||
int ret = GetJpegImageInfo(imageInfo.data.get(), imageInfo.lenOfByte, &(inputImage_->width), &(inputImage_->height),
|
||||
&components);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to get input image info, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
// Get the buffer size of decode output according to the input data and output format
|
||||
uint32_t outBuffSize;
|
||||
ret = GetJpegDecodeDataSize(imageInfo.data.get(), imageInfo.lenOfByte, format, &outBuffSize);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to get size of decode output buffer, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
// In TransferImageH2D function, device buffer will be allocated to store the input image
|
||||
// Need to pay attention to release of the buffer
|
||||
ret = TransferImageH2D(imageInfo, inputImage_);
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
|
||||
decodedImage_ = std::make_shared<DvppDataInfo>();
|
||||
decodedImage_->format = format;
|
||||
decodedImage_->width = inputImage_->width;
|
||||
decodedImage_->height = inputImage_->height;
|
||||
GetJpegDecodeStrideSize(inputImage_->width, inputImage_->height, &(decodedImage_->widthStride),
|
||||
&(decodedImage_->heightStride));
|
||||
decodedImage_->dataSize = outBuffSize;
|
||||
// Need to pay attention to release of the buffer
|
||||
ret = acldvppMalloc(reinterpret_cast<void **>(&decodedImage_->data), decodedImage_->dataSize);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to malloc memory on dvpp, ret = " << ret << "." << std::endl;
|
||||
RELEASE_DVPP_DATA(inputImage_->data);
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = JpegDecode(inputImage_, decodedImage_, withSynchronize);
|
||||
if (ret != OK) {
|
||||
RELEASE_DVPP_DATA(inputImage_->data);
|
||||
inputImage_->data = nullptr;
|
||||
RELEASE_DVPP_DATA(decodedImage_->data);
|
||||
decodedImage_->data = nullptr;
|
||||
return ret;
|
||||
}
|
||||
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Transfer data from host to device
|
||||
* @param: imageInfo specifies the image data on the host
|
||||
* @param: jpegInput is used to save the buffer and its size which is allocate on the device
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::TransferImageH2D(const RawData& imageInfo, const std::shared_ptr<DvppDataInfo>& jpegInput) {
|
||||
if (imageInfo.lenOfByte == 0) {
|
||||
std::cout << "The input buffer size on host should not be empty." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
|
||||
uint8_t* inDevBuff = nullptr;
|
||||
int ret = acldvppMalloc(reinterpret_cast<void **>(&inDevBuff), imageInfo.lenOfByte);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to malloc " << imageInfo.lenOfByte << " bytes on dvpp, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
// Copy the image data from host to device
|
||||
ret = aclrtMemcpyAsync(inDevBuff, imageInfo.lenOfByte, imageInfo.data.get(), imageInfo.lenOfByte,
|
||||
ACL_MEMCPY_HOST_TO_DEVICE, dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to copy " << imageInfo.lenOfByte << " bytes from host to device" << std::endl;
|
||||
RELEASE_DVPP_DATA(inDevBuff);
|
||||
return ret;
|
||||
}
|
||||
// Attention: We must call the aclrtSynchronizeStream to ensure the task of memory replication has been completed
|
||||
// after calling aclrtMemcpyAsync
|
||||
ret = aclrtSynchronizeStream(dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to synchronize stream, ret = " << ret << "." << std::endl;
|
||||
RELEASE_DVPP_DATA(inDevBuff);
|
||||
return ret;
|
||||
}
|
||||
jpegInput->data = inDevBuff;
|
||||
jpegInput->dataSize = imageInfo.lenOfByte;
|
||||
return OK;
|
||||
}
|
||||
|
||||
std::shared_ptr<DvppDataInfo> DvppCommon::GetInputImage() {
|
||||
return inputImage_;
|
||||
}
|
||||
|
||||
std::shared_ptr<DvppDataInfo> DvppCommon::GetDecodedImage() {
|
||||
return decodedImage_;
|
||||
}
|
||||
|
||||
std::shared_ptr<DvppDataInfo> DvppCommon::GetResizedImage() {
|
||||
return resizedImage_;
|
||||
}
|
||||
|
||||
DvppCommon::~DvppCommon() {}
|
|
@ -1,226 +0,0 @@
|
|||
/*
|
||||
* Copyright(C) 2020. Huawei Technologies Co.,Ltd. All rights reserved.
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include <sys/time.h>
|
||||
#include <fstream>
|
||||
#include "../inc/ModelProcess.h"
|
||||
|
||||
ModelProcess::ModelProcess(const int deviceId) {
|
||||
deviceId_ = deviceId;
|
||||
}
|
||||
|
||||
ModelProcess::ModelProcess() {}
|
||||
|
||||
ModelProcess::~ModelProcess() {
|
||||
if (!isDeInit_) {
|
||||
DeInit();
|
||||
}
|
||||
}
|
||||
|
||||
void ModelProcess::DestroyDataset(aclmdlDataset *dataset) {
|
||||
// Just release the DataBuffer object and DataSet object, remain the buffer, because it is managerd by user
|
||||
if (dataset != nullptr) {
|
||||
for (size_t i = 0; i < aclmdlGetDatasetNumBuffers(dataset); i++) {
|
||||
aclDataBuffer* dataBuffer = aclmdlGetDatasetBuffer(dataset, i);
|
||||
if (dataBuffer != nullptr) {
|
||||
aclDestroyDataBuffer(dataBuffer);
|
||||
dataBuffer = nullptr;
|
||||
}
|
||||
}
|
||||
aclmdlDestroyDataset(dataset);
|
||||
}
|
||||
}
|
||||
|
||||
aclmdlDesc *ModelProcess::GetModelDesc() {
|
||||
return modelDesc_.get();
|
||||
}
|
||||
|
||||
int ModelProcess::ModelInference(const std::vector<void *> &inputBufs,
|
||||
const std::vector<size_t> &inputSizes,
|
||||
const std::vector<void *> &ouputBufs,
|
||||
const std::vector<size_t> &outputSizes,
|
||||
std::map<double, double> *costTime_map) {
|
||||
std::cout << "ModelProcess:Begin to inference." << std::endl;
|
||||
aclmdlDataset *input = nullptr;
|
||||
input = CreateAndFillDataset(inputBufs, inputSizes);
|
||||
if (input == nullptr) {
|
||||
return INVALID_POINTER;
|
||||
}
|
||||
int ret;
|
||||
|
||||
aclmdlDataset *output = nullptr;
|
||||
output = CreateAndFillDataset(ouputBufs, outputSizes);
|
||||
if (output == nullptr) {
|
||||
DestroyDataset(input);
|
||||
input = nullptr;
|
||||
return INVALID_POINTER;
|
||||
}
|
||||
struct timeval start;
|
||||
struct timeval end;
|
||||
double startTime_ms;
|
||||
double endTime_ms;
|
||||
mtx_.lock();
|
||||
gettimeofday(&start, NULL);
|
||||
ret = aclmdlExecute(modelId_, input, output);
|
||||
gettimeofday(&end, NULL);
|
||||
startTime_ms = (1.0 * start.tv_sec * 1000000 + start.tv_usec) / 1000;
|
||||
endTime_ms = (1.0 * end.tv_sec * 1000000 + end.tv_usec) / 1000;
|
||||
costTime_map->insert(std::pair<double, double>(startTime_ms, endTime_ms));
|
||||
mtx_.unlock();
|
||||
if (ret != OK) {
|
||||
std::cout << "aclmdlExecute failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
DestroyDataset(input);
|
||||
DestroyDataset(output);
|
||||
return OK;
|
||||
}
|
||||
|
||||
int ModelProcess::DeInit() {
|
||||
isDeInit_ = true;
|
||||
int ret = aclmdlUnload(modelId_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclmdlUnload failed, ret["<< ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
if (modelDevPtr_ != nullptr) {
|
||||
ret = aclrtFree(modelDevPtr_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtFree failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
modelDevPtr_ = nullptr;
|
||||
}
|
||||
if (weightDevPtr_ != nullptr) {
|
||||
ret = aclrtFree(weightDevPtr_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtFree failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
weightDevPtr_ = nullptr;
|
||||
}
|
||||
|
||||
return OK;
|
||||
}
|
||||
/**
|
||||
* Read a binary file, store the data into a uint8_t array
|
||||
*
|
||||
* @param fileName the file for reading
|
||||
* @param buffShared a shared pointer to a uint8_t array for storing file
|
||||
* @param buffLength the length of the array
|
||||
* @return OK if create success, error code otherwise
|
||||
*/
|
||||
int ModelProcess::ReadBinaryFile(const std::string &fileName, uint8_t **buffShared, int *buffLength) {
|
||||
std::ifstream inFile(fileName, std::ios::in | std::ios::binary);
|
||||
if (!inFile) {
|
||||
std::cout << "FaceFeatureLib: read file " << fileName << " fail." <<std::endl;
|
||||
return READ_FILE_FAIL;
|
||||
}
|
||||
|
||||
inFile.seekg(0, inFile.end);
|
||||
*buffLength = inFile.tellg();
|
||||
inFile.seekg(0, inFile.beg);
|
||||
|
||||
uint8_t *tempShared = reinterpret_cast<uint8_t *>(malloc(*buffLength));
|
||||
inFile.read(reinterpret_cast<char *>(tempShared), *buffLength);
|
||||
inFile.close();
|
||||
*buffShared = tempShared;
|
||||
|
||||
std::cout << "read file: fileName=" << fileName << ", size=" << *buffLength << "." << std::endl;
|
||||
|
||||
return OK;
|
||||
}
|
||||
|
||||
int ModelProcess::Init(const std::string &modelPath) {
|
||||
std::cout << "ModelProcess:Begin to init instance." << std::endl;
|
||||
int modelSize = 0;
|
||||
uint8_t *modelData = nullptr;
|
||||
int ret = ReadBinaryFile(modelPath, &modelData, &modelSize);
|
||||
if (ret != OK) {
|
||||
std::cout << "read model file failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = aclmdlQuerySizeFromMem(modelData, modelSize, &modelDevPtrSize_, &weightDevPtrSize_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclmdlQuerySizeFromMem failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
std::cout << "modelDevPtrSize_[" << modelDevPtrSize_ << "]" << std::endl;
|
||||
std::cout << " weightDevPtrSize_[" << weightDevPtrSize_ << "]." << std::endl;
|
||||
|
||||
ret = aclrtMalloc(&modelDevPtr_, modelDevPtrSize_, ACL_MEM_MALLOC_HUGE_FIRST);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtMalloc dev_ptr failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = aclrtMalloc(&weightDevPtr_, weightDevPtrSize_, ACL_MEM_MALLOC_HUGE_FIRST);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtMalloc weight_ptr failed, ret[" << ret << "] " << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = aclmdlLoadFromMemWithMem(modelData, modelSize, &modelId_, modelDevPtr_, modelDevPtrSize_,
|
||||
weightDevPtr_, weightDevPtrSize_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclmdlLoadFromMemWithMem failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = aclrtGetCurrentContext(&contextModel_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtMalloc weight_ptr failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
aclmdlDesc *modelDesc = aclmdlCreateDesc();
|
||||
if (modelDesc == nullptr) {
|
||||
std::cout << "aclmdlCreateDesc failed." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = aclmdlGetDesc(modelDesc, modelId_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclmdlGetDesc ret fail, ret:" << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
modelDesc_.reset(modelDesc, aclmdlDestroyDesc);
|
||||
free(modelData);
|
||||
return OK;
|
||||
}
|
||||
|
||||
aclmdlDataset *ModelProcess::CreateAndFillDataset(const std::vector<void *> &bufs, const std::vector<size_t> &sizes) {
|
||||
aclmdlDataset *dataset = aclmdlCreateDataset();
|
||||
if (dataset == nullptr) {
|
||||
std::cout << "ACL_ModelInputCreate failed." << std::endl;
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
for (size_t i = 0; i < bufs.size(); ++i) {
|
||||
aclDataBuffer *data = aclCreateDataBuffer(bufs[i], sizes[i]);
|
||||
if (data == nullptr) {
|
||||
DestroyDataset(dataset);
|
||||
std::cout << "aclCreateDataBuffer failed." << std::endl;
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
int ret = aclmdlAddDatasetBuffer(dataset, data);
|
||||
if (ret != OK) {
|
||||
DestroyDataset(dataset);
|
||||
std::cout << "ACL_ModelInputDataAdd failed, ret[" << ret << "]." << std::endl;
|
||||
return nullptr;
|
||||
}
|
||||
}
|
||||
return dataset;
|
||||
}
|
|
@ -1,56 +0,0 @@
|
|||
#!/bin/bash
|
||||
# Copyright 2020 Huawei Technologies Co., Ltd
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
# ============================================================================
|
||||
path_cur=$(cd "`dirname $0`" || exit; pwd)
|
||||
build_type="Release"
|
||||
|
||||
function preparePath() {
|
||||
rm -rf $1
|
||||
mkdir -p $1
|
||||
cd $1 || exit
|
||||
}
|
||||
|
||||
function buildA300() {
|
||||
if [ ! "${ARCH_PATTERN}" ]; then
|
||||
# set ARCH_PATTERN to acllib when it was not specified by user
|
||||
export ARCH_PATTERN=acllib
|
||||
echo "ARCH_PATTERN is set to the default value: ${ARCH_PATTERN}"
|
||||
else
|
||||
echo "ARCH_PATTERN is set to ${ARCH_PATTERN} by user, reset it to ${ARCH_PATTERN}/acllib"
|
||||
export ARCH_PATTERN=${ARCH_PATTERN}/acllib
|
||||
fi
|
||||
|
||||
path_build=$path_cur/build
|
||||
preparePath $path_build
|
||||
cmake -DCMAKE_BUILD_TYPE=$build_type ..
|
||||
make -j
|
||||
ret=$?
|
||||
cd ..
|
||||
return ${ret}
|
||||
}
|
||||
|
||||
# set ASCEND_VERSION to ascend-toolkit/latest when it was not specified by user
|
||||
if [ ! "${ASCEND_VERSION}" ]; then
|
||||
export ASCEND_VERSION=ascend-toolkit/latest
|
||||
echo "Set ASCEND_VERSION to the default value: ${ASCEND_VERSION}"
|
||||
else
|
||||
echo "ASCEND_VERSION is set to ${ASCEND_VERSION} by user"
|
||||
fi
|
||||
|
||||
buildA300
|
||||
|
||||
if [ $? -ne 0 ]; then
|
||||
exit 1
|
||||
fi
|
|
@ -0,0 +1,236 @@
|
|||
/**
|
||||
* Copyright 2021 Huawei Technologies Co., Ltd
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
#include <sys/time.h>
|
||||
#include <gflags/gflags.h>
|
||||
#include <dirent.h>
|
||||
#include <iostream>
|
||||
#include <string>
|
||||
#include <algorithm>
|
||||
#include <iosfwd>
|
||||
#include <vector>
|
||||
#include <fstream>
|
||||
#include <sstream>
|
||||
|
||||
#include "include/api/context.h"
|
||||
#include "include/api/model.h"
|
||||
#include "include/api/types.h"
|
||||
#include "include/api/serialization.h"
|
||||
#include "include/minddata/dataset/include/vision.h"
|
||||
#include "include/minddata/dataset/include/execute.h"
|
||||
#include "../inc/utils.h"
|
||||
|
||||
using mindspore::Context;
|
||||
using mindspore::Serialization;
|
||||
using mindspore::Model;
|
||||
using mindspore::Status;
|
||||
using mindspore::ModelType;
|
||||
using mindspore::GraphCell;
|
||||
using mindspore::kSuccess;
|
||||
using mindspore::MSTensor;
|
||||
using mindspore::DataType;
|
||||
using mindspore::dataset::Execute;
|
||||
using mindspore::dataset::TensorTransform;
|
||||
using mindspore::dataset::vision::Resize;
|
||||
using mindspore::dataset::vision::Pad;
|
||||
using mindspore::dataset::vision::HWC2CHW;
|
||||
using mindspore::dataset::vision::Normalize;
|
||||
using mindspore::dataset::vision::SwapRedBlue;
|
||||
using mindspore::dataset::vision::Decode;
|
||||
|
||||
|
||||
DEFINE_string(mindir_path, "", "mindir path");
|
||||
DEFINE_string(dataset_path, ".", "dataset path");
|
||||
DEFINE_int32(device_id, 0, "device id");
|
||||
|
||||
const int IMAGEWIDTH = 1280;
|
||||
const int IMAGEHEIGHT = 768;
|
||||
|
||||
int PadImage(const MSTensor &input, MSTensor *output) {
|
||||
std::shared_ptr<TensorTransform> normalize(new Normalize({103.53, 116.28, 123.675},
|
||||
{57.375, 57.120, 58.395}));
|
||||
Execute composeNormalize({normalize});
|
||||
std::vector<int64_t> shape = input.Shape();
|
||||
auto imgResize = MSTensor();
|
||||
auto imgPad = MSTensor();
|
||||
|
||||
float widthScale, heightScale;
|
||||
widthScale = static_cast<float>(IMAGEWIDTH) / shape[1];
|
||||
heightScale = static_cast<float>(IMAGEHEIGHT) / shape[0];
|
||||
Status ret;
|
||||
if (widthScale < heightScale) {
|
||||
int heightSize = shape[0]*widthScale;
|
||||
std::shared_ptr<TensorTransform> resize(new Resize({heightSize, IMAGEWIDTH}));
|
||||
Execute composeResizeWidth({resize});
|
||||
ret = composeResizeWidth(input, &imgResize);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Resize Width failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
int paddingSize = IMAGEHEIGHT - heightSize;
|
||||
std::shared_ptr<TensorTransform> pad(new Pad({0, 0, 0, paddingSize}));
|
||||
Execute composePad({pad});
|
||||
ret = composePad(imgResize, &imgPad);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Height Pad failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
ret = composeNormalize(imgPad, output);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Normalize failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
} else {
|
||||
int widthSize = shape[1]*heightScale;
|
||||
std::shared_ptr<TensorTransform> resize(new Resize({IMAGEHEIGHT, widthSize}));
|
||||
Execute composeResizeHeight({resize});
|
||||
ret = composeResizeHeight(input, &imgResize);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Resize Height failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
int paddingSize = IMAGEWIDTH - widthSize;
|
||||
std::shared_ptr<TensorTransform> pad(new Pad({0, 0, paddingSize, 0}));
|
||||
Execute composePad({pad});
|
||||
ret = composePad(imgResize, &imgPad);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Width Pad failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
ret = composeNormalize(imgPad, output);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Normalize failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
}
|
||||
return 0;
|
||||
}
|
||||
|
||||
int main(int argc, char **argv) {
|
||||
gflags::ParseCommandLineFlags(&argc, &argv, true);
|
||||
if (RealPath(FLAGS_mindir_path).empty()) {
|
||||
std::cout << "Invalid mindir" << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
auto context = std::make_shared<Context>();
|
||||
auto ascend310 = std::make_shared<mindspore::Ascend310DeviceInfo>();
|
||||
ascend310->SetDeviceID(FLAGS_device_id);
|
||||
ascend310->SetPrecisionMode("allow_fp32_to_fp16");
|
||||
context->MutableDeviceInfo().push_back(ascend310);
|
||||
mindspore::Graph graph;
|
||||
Serialization::Load(FLAGS_mindir_path, ModelType::kMindIR, &graph);
|
||||
|
||||
Model model;
|
||||
Status ret = model.Build(GraphCell(graph), context);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Build failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
std::vector<MSTensor> model_inputs = model.GetInputs();
|
||||
if (model_inputs.empty()) {
|
||||
std::cout << "Invalid model, inputs is empty." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
auto all_files = GetAllFiles(FLAGS_dataset_path);
|
||||
if (all_files.empty()) {
|
||||
std::cout << "ERROR: no input data." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
std::map<double, double> costTime_map;
|
||||
size_t size = all_files.size();
|
||||
std::shared_ptr<TensorTransform> decode(new Decode());
|
||||
Execute composeDecode({decode});
|
||||
std::shared_ptr<TensorTransform> hwc2chw(new HWC2CHW());
|
||||
Execute composeTranspose({hwc2chw});
|
||||
|
||||
for (size_t i = 0; i < size; ++i) {
|
||||
struct timeval start = {0};
|
||||
struct timeval end = {0};
|
||||
double startTimeMs;
|
||||
double endTimeMs;
|
||||
std::vector<MSTensor> inputs;
|
||||
std::vector<MSTensor> outputs;
|
||||
std::cout << "Start predict input files:" << all_files[i] << std::endl;
|
||||
auto imgDecode = MSTensor();
|
||||
auto image = ReadFileToTensor(all_files[i]);
|
||||
ret = composeDecode(image, &imgDecode);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Decode failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
auto imgPad = MSTensor();
|
||||
PadImage(imgDecode, &imgPad);
|
||||
auto img = MSTensor();
|
||||
composeTranspose(imgPad, &img);
|
||||
|
||||
std::vector<int64_t> shape = imgDecode.Shape();
|
||||
|
||||
float widthScale = static_cast<float>(IMAGEWIDTH) / shape[1];
|
||||
float heightScale = static_cast<float>(IMAGEHEIGHT) / shape[0];
|
||||
float resizeScale = widthScale < heightScale ? widthScale : heightScale;
|
||||
|
||||
float imgInfo[4];
|
||||
imgInfo[0] = shape[0];
|
||||
imgInfo[1] = shape[1];
|
||||
imgInfo[2] = resizeScale;
|
||||
imgInfo[3] = resizeScale;
|
||||
|
||||
MSTensor imgMeta("imgMeta", DataType::kNumberTypeFloat32, {static_cast<int64_t>(4)}, imgInfo, 16);
|
||||
|
||||
inputs.emplace_back(model_inputs[0].Name(), model_inputs[0].DataType(), model_inputs[0].Shape(),
|
||||
img.Data().get(), img.DataSize());
|
||||
inputs.emplace_back(model_inputs[1].Name(), model_inputs[1].DataType(), model_inputs[1].Shape(),
|
||||
imgMeta.Data().get(), imgMeta.DataSize());
|
||||
|
||||
gettimeofday(&start, nullptr);
|
||||
ret = model.Predict(inputs, &outputs);
|
||||
gettimeofday(&end, nullptr);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "Predict " << all_files[i] << " failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
startTimeMs = (1.0 * start.tv_sec * 1000000 + start.tv_usec) / 1000;
|
||||
endTimeMs = (1.0 * end.tv_sec * 1000000 + end.tv_usec) / 1000;
|
||||
costTime_map.insert(std::pair<double, double>(startTimeMs, endTimeMs));
|
||||
WriteResult(all_files[i], outputs);
|
||||
}
|
||||
double average = 0.0;
|
||||
int inferCount = 0;
|
||||
|
||||
for (auto iter = costTime_map.begin(); iter != costTime_map.end(); iter++) {
|
||||
double diff = 0.0;
|
||||
diff = iter->second - iter->first;
|
||||
average += diff;
|
||||
inferCount++;
|
||||
}
|
||||
average = average / inferCount;
|
||||
std::stringstream timeCost;
|
||||
timeCost << "NN inference cost average time: "<< average << " ms of infer_count " << inferCount << std::endl;
|
||||
std::cout << "NN inference cost average time: "<< average << "ms of infer_count " << inferCount << std::endl;
|
||||
|
||||
std::string fileName = "./time_Result" + std::string("/test_perform_static.txt");
|
||||
std::ofstream fileStream(fileName.c_str(), std::ios::trunc);
|
||||
fileStream << timeCost.str();
|
||||
fileStream.close();
|
||||
costTime_map.clear();
|
||||
return 0;
|
||||
}
|
|
@ -1,136 +0,0 @@
|
|||
/*
|
||||
* Copyright (c) 2020.Huawei Technologies Co., Ltd. All rights reserved.
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
#include <dirent.h>
|
||||
#include <sys/stat.h>
|
||||
#include <gflags/gflags.h>
|
||||
#include <unistd.h>
|
||||
#include <cstring>
|
||||
#include <fstream>
|
||||
#include <sstream>
|
||||
#include "../inc/AclProcess.h"
|
||||
#include "../inc/CommonDataType.h"
|
||||
|
||||
DEFINE_string(om_path, "./fasterrcnn.om", "om model path.");
|
||||
DEFINE_string(data_path, "./test.jpg", "om model path.");
|
||||
DEFINE_int32(width, 1280, "width");
|
||||
DEFINE_int32(height, 768, "height");
|
||||
DEFINE_int32(device_id, 0, "height");
|
||||
|
||||
static bool is_file(const std::string &filename) {
|
||||
struct stat buffer;
|
||||
return (stat(filename.c_str(), &buffer) == 0 && S_ISREG(buffer.st_mode));
|
||||
}
|
||||
|
||||
static bool is_dir(const std::string &filefodler) {
|
||||
struct stat buffer;
|
||||
return (stat(filefodler.c_str(), &buffer) == 0 && S_ISDIR(buffer.st_mode));
|
||||
}
|
||||
/*
|
||||
* @description Initialize and run AclProcess module
|
||||
* @param resourceInfo resource info of deviceIds, model info, single Operator Path, etc
|
||||
* @param file the absolute path of input file
|
||||
* @return int int code
|
||||
*/
|
||||
int main(int argc, char* argv[]) {
|
||||
gflags::ParseCommandLineFlags(&argc, &argv, true);
|
||||
std::cout << "OM File Path :" << FLAGS_om_path << std::endl;
|
||||
std::cout << "data Path :" << FLAGS_data_path << std::endl;
|
||||
std::cout << "width :" << FLAGS_width << std::endl;
|
||||
std::cout << "height :" << FLAGS_height << std::endl;
|
||||
std::cout << "deviceId :" << FLAGS_device_id << std::endl;
|
||||
|
||||
char omAbsPath[PATH_MAX];
|
||||
if (realpath(FLAGS_om_path.c_str(), omAbsPath) == nullptr) {
|
||||
std::cout << "Failed to get the om real path." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
|
||||
if (access(omAbsPath, R_OK) == -1) {
|
||||
std::cout << "ModelPath " << omAbsPath << " doesn't exist or read failed." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
|
||||
char dataAbsPath[PATH_MAX];
|
||||
if (realpath(FLAGS_data_path.c_str(), dataAbsPath) == nullptr) {
|
||||
std::cout << "Failed to get the data real path." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
if (access(dataAbsPath, R_OK) == -1) {
|
||||
std::cout << "data paeh " << dataAbsPath << " doesn't exist or read failed." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
|
||||
std::map<double, double> costTime_map;
|
||||
AclProcess aclProcess(FLAGS_device_id, FLAGS_om_path, FLAGS_width, FLAGS_height);
|
||||
int ret = aclProcess.InitResource();
|
||||
if (ret != OK) {
|
||||
aclProcess.Release();
|
||||
return ret;
|
||||
}
|
||||
if (is_file(FLAGS_data_path)) {
|
||||
ret = aclProcess.Process(FLAGS_data_path, &costTime_map);
|
||||
if (ret != OK) {
|
||||
std::cout << "model process failed, errno = " << ret << std::endl;
|
||||
aclProcess.Release();
|
||||
return ret;
|
||||
}
|
||||
} else if (is_dir(FLAGS_data_path)) {
|
||||
struct dirent *filename;
|
||||
DIR *dir;
|
||||
dir = opendir(FLAGS_data_path.c_str());
|
||||
if (dir == nullptr) {
|
||||
aclProcess.Release();
|
||||
return ERROR;
|
||||
}
|
||||
|
||||
while ((filename = readdir(dir)) != nullptr) {
|
||||
if (strcmp(filename->d_name, ".") == 0 || strcmp(filename->d_name, "..") == 0) {
|
||||
continue;
|
||||
}
|
||||
std::string wholePath = FLAGS_data_path + "/" + filename->d_name;
|
||||
ret = aclProcess.Process(wholePath, &costTime_map);
|
||||
if (ret != OK) {
|
||||
std::cout << "model process failed, errno = " << ret << std::endl;
|
||||
aclProcess.Release();
|
||||
return ret;
|
||||
}
|
||||
}
|
||||
} else {
|
||||
std::cout << " input image path error" << std::endl;
|
||||
}
|
||||
|
||||
double average = 0.0;
|
||||
int infer_cnt = 0;
|
||||
for (auto iter = costTime_map.begin(); iter != costTime_map.end(); iter++) {
|
||||
double diff = 0.0;
|
||||
diff = iter->second - iter->first;
|
||||
average += diff;
|
||||
infer_cnt++;
|
||||
}
|
||||
average = average / infer_cnt;
|
||||
|
||||
std::stringstream timeCost;
|
||||
timeCost << "NN inference cost average time: "<< average << " ms of infer_count " << infer_cnt << std::endl;
|
||||
std::cout << "NN inference cost average time: "<< average << "ms of infer_count " << infer_cnt << std::endl;
|
||||
|
||||
std::string file_name = "./time_Result" + std::string("/test_perform_static.txt");
|
||||
std::ofstream file_stream(file_name.c_str(), std::ios::trunc);
|
||||
file_stream << timeCost.str();
|
||||
file_stream.close();
|
||||
costTime_map.clear();
|
||||
|
||||
aclProcess.Release();
|
||||
return OK;
|
||||
}
|
|
@ -0,0 +1,129 @@
|
|||
/**
|
||||
* Copyright 2021 Huawei Technologies Co., Ltd
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include <fstream>
|
||||
#include <algorithm>
|
||||
#include <iostream>
|
||||
#include "../inc/utils.h"
|
||||
|
||||
using mindspore::MSTensor;
|
||||
using mindspore::DataType;
|
||||
|
||||
std::vector<std::string> GetAllFiles(std::string_view dirName) {
|
||||
struct dirent *filename;
|
||||
DIR *dir = OpenDir(dirName);
|
||||
if (dir == nullptr) {
|
||||
return {};
|
||||
}
|
||||
std::vector<std::string> res;
|
||||
while ((filename = readdir(dir)) != nullptr) {
|
||||
std::string dName = std::string(filename->d_name);
|
||||
if (dName == "." || dName == ".." || filename->d_type != DT_REG) {
|
||||
continue;
|
||||
}
|
||||
res.emplace_back(std::string(dirName) + "/" + filename->d_name);
|
||||
}
|
||||
std::sort(res.begin(), res.end());
|
||||
for (auto &f : res) {
|
||||
std::cout << "image file: " << f << std::endl;
|
||||
}
|
||||
return res;
|
||||
}
|
||||
|
||||
int WriteResult(const std::string& imageFile, const std::vector<MSTensor> &outputs) {
|
||||
std::string homePath = "./result_Files";
|
||||
for (size_t i = 0; i < outputs.size(); ++i) {
|
||||
size_t outputSize;
|
||||
std::shared_ptr<const void> netOutput;
|
||||
netOutput = outputs[i].Data();
|
||||
outputSize = outputs[i].DataSize();
|
||||
int pos = imageFile.rfind('/');
|
||||
std::string fileName(imageFile, pos + 1);
|
||||
fileName.replace(fileName.find('.'), fileName.size() - fileName.find('.'), '_' + std::to_string(i) + ".bin");
|
||||
std::string outFileName = homePath + "/" + fileName;
|
||||
FILE * outputFile = fopen(outFileName.c_str(), "wb");
|
||||
fwrite(netOutput.get(), outputSize, sizeof(char), outputFile);
|
||||
fclose(outputFile);
|
||||
outputFile = nullptr;
|
||||
}
|
||||
return 0;
|
||||
}
|
||||
|
||||
MSTensor ReadFileToTensor(const std::string &file) {
|
||||
if (file.empty()) {
|
||||
std::cout << "Pointer file is nullptr" << std::endl;
|
||||
return MSTensor();
|
||||
}
|
||||
|
||||
std::ifstream ifs(file);
|
||||
if (!ifs.good()) {
|
||||
std::cout << "File: " << file << " is not exist" << std::endl;
|
||||
return MSTensor();
|
||||
}
|
||||
|
||||
if (!ifs.is_open()) {
|
||||
std::cout << "File: " << file << "open failed" << std::endl;
|
||||
return MSTensor();
|
||||
}
|
||||
|
||||
ifs.seekg(0, std::ios::end);
|
||||
size_t size = ifs.tellg();
|
||||
MSTensor buffer(file, mindspore::DataType::kNumberTypeUInt8, {static_cast<int64_t>(size)}, nullptr, size);
|
||||
|
||||
ifs.seekg(0, std::ios::beg);
|
||||
ifs.read(reinterpret_cast<char *>(buffer.MutableData()), size);
|
||||
ifs.close();
|
||||
|
||||
return buffer;
|
||||
}
|
||||
|
||||
|
||||
DIR *OpenDir(std::string_view dirName) {
|
||||
if (dirName.empty()) {
|
||||
std::cout << " dirName is null ! " << std::endl;
|
||||
return nullptr;
|
||||
}
|
||||
std::string realPath = RealPath(dirName);
|
||||
struct stat s;
|
||||
lstat(realPath.c_str(), &s);
|
||||
if (!S_ISDIR(s.st_mode)) {
|
||||
std::cout << "dirName is not a valid directory !" << std::endl;
|
||||
return nullptr;
|
||||
}
|
||||
DIR *dir;
|
||||
dir = opendir(realPath.c_str());
|
||||
if (dir == nullptr) {
|
||||
std::cout << "Can not open dir " << dirName << std::endl;
|
||||
return nullptr;
|
||||
}
|
||||
std::cout << "Successfully opened the dir " << dirName << std::endl;
|
||||
return dir;
|
||||
}
|
||||
|
||||
std::string RealPath(std::string_view path) {
|
||||
char realPathMem[PATH_MAX] = {0};
|
||||
char *realPathRet = nullptr;
|
||||
realPathRet = realpath(path.data(), realPathMem);
|
||||
|
||||
if (realPathRet == nullptr) {
|
||||
std::cout << "File: " << path << " is not exist.";
|
||||
return "";
|
||||
}
|
||||
|
||||
std::string realPath(realPathMem);
|
||||
std::cout << path << " realpath is: " << realPath << std::endl;
|
||||
return realPath;
|
||||
}
|
|
@ -13,6 +13,7 @@
|
|||
# limitations under the License.
|
||||
# ============================================================================
|
||||
"""post process for 310 inference"""
|
||||
import os
|
||||
import argparse
|
||||
import numpy as np
|
||||
from pycocotools.coco import COCO
|
||||
|
@ -25,13 +26,13 @@ dst_height = 768
|
|||
|
||||
parser = argparse.ArgumentParser(description="FasterRcnn inference")
|
||||
parser.add_argument("--ann_file", type=str, required=True, help="ann file.")
|
||||
parser.add_argument("--img_path", type=str, required=True, help="image file path.")
|
||||
parser.add_argument("--result_path", type=str, required=True, help="result file path.")
|
||||
args = parser.parse_args()
|
||||
|
||||
def get_eval_result(ann_file):
|
||||
def get_eval_result(ann_file, result_path):
|
||||
""" get evaluation result of faster rcnn"""
|
||||
max_num = 128
|
||||
result_path = "./result_Files/"
|
||||
result_path = result_path
|
||||
|
||||
outputs = []
|
||||
|
||||
|
@ -41,9 +42,9 @@ def get_eval_result(ann_file):
|
|||
for img_id in img_ids:
|
||||
file_id = str(img_id).zfill(12)
|
||||
|
||||
bbox_result_file = result_path + file_id + "_0.bin"
|
||||
label_result_file = result_path + file_id + "_1.bin"
|
||||
mask_result_file = result_path + file_id + "_2.bin"
|
||||
bbox_result_file = os.path.join(result_path, file_id + "_0.bin")
|
||||
label_result_file = os.path.join(result_path, file_id + "_1.bin")
|
||||
mask_result_file = os.path.join(result_path, file_id + "_2.bin")
|
||||
|
||||
all_bbox = np.fromfile(bbox_result_file, dtype=np.float16).reshape(80000, 5)
|
||||
all_label = np.fromfile(label_result_file, dtype=np.int32).reshape(80000, 1)
|
||||
|
@ -70,4 +71,4 @@ def get_eval_result(ann_file):
|
|||
coco_eval(result_files, eval_types, dataset_coco, single_result=False)
|
||||
|
||||
if __name__ == '__main__':
|
||||
get_eval_result(args.ann_file)
|
||||
get_eval_result(args.ann_file, args.result_path)
|
||||
|
|
|
@ -15,60 +15,50 @@
|
|||
# ============================================================================
|
||||
|
||||
if [[ $# -lt 3 || $# -gt 4 ]]; then
|
||||
echo "Usage: sh run_infer_310.sh [AIR_PATH] [DATA_PATH] [ANN_FILE_PATH] [DEVICE_ID]
|
||||
echo "Usage: bash run_infer_310.sh [MINDIR_PATH] [DATA_PATH] [ANN_FILE] [DEVICE_ID]
|
||||
DEVICE_ID is optional, it can be set by environment variable device_id, otherwise the value is zero"
|
||||
exit 1
|
||||
fi
|
||||
|
||||
get_real_path(){
|
||||
if [ "${1:0:1}" == "/" ]; then
|
||||
echo "$1"
|
||||
else
|
||||
echo "$(realpath -m $PWD/$1)"
|
||||
fi
|
||||
if [ "${1:0:1}" == "/" ]; then
|
||||
echo "$1"
|
||||
else
|
||||
echo "$(realpath -m $PWD/$1)"
|
||||
fi
|
||||
}
|
||||
model=$(get_real_path $1)
|
||||
data_path=$(get_real_path $2)
|
||||
ann_file=$(get_real_path $3)
|
||||
|
||||
device_id=0
|
||||
if [ $# == 4 ]; then
|
||||
device_id=$4
|
||||
elif [ $# == 3 ]; then
|
||||
# shellcheck disable=SC2153 #DEVICE_ID is en
|
||||
if [ -z $device_id ]; then
|
||||
device_id=0
|
||||
else
|
||||
device_id=$device_id
|
||||
fi
|
||||
fi
|
||||
|
||||
echo $model
|
||||
echo $data_path
|
||||
echo $ann_file
|
||||
echo $device_id
|
||||
echo "mindir name: "$model
|
||||
echo "dataset path: "$data_path
|
||||
echo "ann_file: " $ann_file
|
||||
echo "device id: "$device_id
|
||||
|
||||
export ASCEND_HOME=/usr/local/Ascend/
|
||||
if [ -d ${ASCEND_HOME}/ascend-toolkit ]; then
|
||||
export PATH=$ASCEND_HOME/ascend-toolkit/latest/fwkacllib/ccec_compiler/bin:$ASCEND_HOME/ascend-toolkit/latest/atc/bin:$PATH
|
||||
export LD_LIBRARY_PATH=/usr/local/lib:$ASCEND_HOME/ascend-toolkit/latest/atc/lib64:$ASCEND_HOME/ascend-toolkit/latest/acllib/lib64:$ASCEND_HOME/ascend-toolkit/latest/fwkacllib/lib64:$ASCEND_HOME/driver/lib64:$ASCEND_HOME/add-ones:$LD_LIBRARY_PATH
|
||||
export LD_LIBRARY_PATH=/usr/local/lib:$ASCEND_HOME/ascend-toolkit/latest/atc/lib64:$ASCEND_HOME/ascend-toolkit/latest/acllib/lib64:$ASCEND_HOME/ascend-toolkit/latest/fwkacllib/lib64:$ASCEND_HOME/driver/lib64:$ASCEND_HOME/add-ons:$LD_LIBRARY_PATH
|
||||
export TBE_IMPL_PATH=${ASCEND_HOME}/ascend-toolkit/latest/opp/op_impl/built-in/ai_core/tbe
|
||||
export PYTHONPATH=${TBE_IMPL_PATH}:$ASCEND_HOME/ascend-toolkit/latest/fwkacllib/python/site-packages:$PYTHONPATH
|
||||
export ASCEND_OPP_PATH=$ASCEND_HOME/ascend-toolkit/latest/opp
|
||||
else
|
||||
export PATH=$ASCEND_HOME/atc/ccec_compiler/bin:$ASCEND_HOME/atc/bin:$PATH
|
||||
export LD_LIBRARY_PATH=/usr/local/lib:$ASCEND_HOME/atc/lib64:$ASCEND_HOME/acllib/lib64:$ASCEND_HOME/driver/lib64:$ASCEND_HOME/add-ones:$LD_LIBRARY_PATH
|
||||
export LD_LIBRARY_PATH=/usr/local/lib:$ASCEND_HOME/atc/lib64:$ASCEND_HOME/acllib/lib64:$ASCEND_HOME/driver/lib64:$ASCEND_HOME/add-ons:$LD_LIBRARY_PATH
|
||||
export PYTHONPATH=$ASCEND_HOME/atc/python/site-packages:$PYTHONPATH
|
||||
export ASCEND_OPP_PATH=$ASCEND_HOME/opp
|
||||
fi
|
||||
|
||||
function air_to_om()
|
||||
{
|
||||
atc --input_format=NCHW --framework=1 --model=$model --input_shape="x:1, 3, 768, 1280; im_info: 1, 4" --output=fasterrcnn --insert_op_conf=../src/aipp.cfg --precision_mode=allow_fp32_to_fp16 --soc_version=Ascend310 &> atc.log
|
||||
}
|
||||
|
||||
function compile_app()
|
||||
{
|
||||
cd ../ascend310_infer/src || exit
|
||||
sh build.sh &> build.log
|
||||
cd ../ascend310_infer || exit
|
||||
bash build.sh &> build.log
|
||||
cd - || exit
|
||||
}
|
||||
|
||||
|
@ -77,24 +67,19 @@ function infer()
|
|||
if [ -d result_Files ]; then
|
||||
rm -rf ./result_Files
|
||||
fi
|
||||
if [ -d time_Result ]; then
|
||||
if [ -d time_Result ]; then
|
||||
rm -rf ./time_Result
|
||||
fi
|
||||
mkdir result_Files
|
||||
mkdir time_Result
|
||||
../ascend310_infer/src/out/main --om_path=./fasterrcnn.om --data_path=$data_path --device_id=$device_id &> infer.log
|
||||
../ascend310_infer/out/main --mindir_path=$model --dataset_path=$data_path --device_id=$device_id &> infer.log
|
||||
}
|
||||
|
||||
function cal_acc()
|
||||
{
|
||||
python ../postprocess.py --ann_file=$ann_file --img_path=$data_path &> acc.log &
|
||||
python3.7 ../postprocess.py --ann_file=$ann_file --result_path=./result_Files &> acc.log &
|
||||
}
|
||||
|
||||
air_to_om
|
||||
if [ $? -ne 0 ]; then
|
||||
echo "air to om failed"
|
||||
exit 1
|
||||
fi
|
||||
compile_app
|
||||
if [ $? -ne 0 ]; then
|
||||
echo "compile app code failed"
|
||||
|
|
|
@ -1,26 +0,0 @@
|
|||
aipp_op {
|
||||
aipp_mode : static
|
||||
input_format : YUV420SP_U8
|
||||
related_input_rank : 0
|
||||
csc_switch : true
|
||||
rbuv_swap_switch : false
|
||||
matrix_r0c0 : 256
|
||||
matrix_r0c1 : 0
|
||||
matrix_r0c2 : 359
|
||||
matrix_r1c0 : 256
|
||||
matrix_r1c1 : -88
|
||||
matrix_r1c2 : -183
|
||||
matrix_r2c0 : 256
|
||||
matrix_r2c1 : 454
|
||||
matrix_r2c2 : 0
|
||||
input_bias_0 : 0
|
||||
input_bias_1 : 128
|
||||
input_bias_2 : 128
|
||||
|
||||
mean_chn_0 : 124
|
||||
mean_chn_1 : 117
|
||||
mean_chn_2 : 104
|
||||
var_reci_chn_0 : 0.0171247538316637
|
||||
var_reci_chn_1 : 0.0175070028011204
|
||||
var_reci_chn_2 : 0.0174291938997821
|
||||
}
|
|
@ -172,7 +172,7 @@ bash run_eval.sh [VALIDATION_JSON_FILE] [CHECKPOINT_PATH]
|
|||
|
||||
```shell
|
||||
# inference
|
||||
bash run_infer_310.sh [AIR_PATH] [DATA_PATH] [ANN_FILE_PATH]
|
||||
bash run_infer_310.sh [MINDIR_PATH] [DATA_PATH] [ANN_FILE] [DEVICE_ID]
|
||||
```
|
||||
|
||||
# [Script Description](#contents)
|
||||
|
@ -203,7 +203,6 @@ bash run_eval.sh [VALIDATION_JSON_FILE] [CHECKPOINT_PATH]
|
|||
├─resnet50.py # backbone network
|
||||
├─roi_align.py # roi align network
|
||||
└─rpn.py # reagion proposal network
|
||||
├─aipp.cfg #aipp config file
|
||||
├─config.py # network configuration
|
||||
├─convert_checkpoint.py # convert resnet50 backbone checkpoint
|
||||
├─dataset.py # dataset utils
|
||||
|
@ -502,7 +501,7 @@ Accumulating evaluation results...
|
|||
python export.py --ckpt_file [CKPT_PATH] --device_target [DEVICE_TARGET] --file_format[EXPORT_FORMAT]
|
||||
```
|
||||
|
||||
`EXPORT_FORMAT` should be in ["AIR", "ONNX", "MINDIR"]
|
||||
`EXPORT_FORMAT` should be in ["AIR", "MINDIR"]
|
||||
|
||||
## Inference Process
|
||||
|
||||
|
@ -513,7 +512,7 @@ Current batch_ Size can only be set to 1. The inference process needs about 600G
|
|||
|
||||
```shell
|
||||
# Ascend310 inference
|
||||
sh run_infer_310.sh [AIR_PATH] [DATA_PATH] [ANN_FILE_PATH]
|
||||
sh run_infer_310.sh [MINDIR_PATH] [DATA_PATH] [ANN_FILE] [DEVICE_ID]
|
||||
```
|
||||
|
||||
### result
|
||||
|
|
|
@ -129,7 +129,7 @@ pip install mmcv=0.2.14
|
|||
|
||||
```bash
|
||||
# 评估
|
||||
sh run_infer_310.sh [AIR_PATH] [DATA_PATH] [ANN_FILE_PATH]
|
||||
sh run_infer_310.sh [MINDIR_PATH] [DATA_PATH] [ANN_FILE] [DEVICE_ID]
|
||||
```
|
||||
|
||||
注:
|
||||
|
@ -197,7 +197,6 @@ bash run_eval.sh [VALIDATION_JSON_FILE] [CHECKPOINT_PATH]
|
|||
├─resnet50.py # 骨干网
|
||||
├─roi_align.py # 兴趣点对齐网络
|
||||
└─rpn.py # 区域候选网络
|
||||
├─aipp.cfg #aipp 配置文件
|
||||
├─config.py # 网络配置
|
||||
├─convert_checkpoint.py # 转换预训练checkpoint文件
|
||||
├─dataset.py # 数据集工具
|
||||
|
@ -500,7 +499,7 @@ sh run_eval.sh [VALIDATION_ANN_FILE_JSON] [CHECKPOINT_PATH]
|
|||
python export.py --ckpt_file [CKPT_PATH] --device_target [DEVICE_TARGET] --file_format[EXPORT_FORMAT]
|
||||
```
|
||||
|
||||
`EXPORT_FORMAT` 选项 ["AIR", "ONNX", "MINDIR"]
|
||||
`EXPORT_FORMAT` 选项 ["AIR", "MINDIR"]
|
||||
|
||||
## 推理过程
|
||||
|
||||
|
@ -510,7 +509,7 @@ python export.py --ckpt_file [CKPT_PATH] --device_target [DEVICE_TARGET] --file_
|
|||
|
||||
```shell
|
||||
# Ascend310 推理
|
||||
sh run_infer_310.sh [AIR_PATH] [DATA_PATH] [ANN_FILE_PATH]
|
||||
sh run_infer_310.sh [MINDIR_PATH] [DATA_PATH] [ANN_FILE] [DEVICE_ID]
|
||||
```
|
||||
|
||||
### 结果
|
||||
|
|
|
@ -0,0 +1,14 @@
|
|||
cmake_minimum_required(VERSION 3.14.1)
|
||||
project(Ascend310Infer)
|
||||
add_compile_definitions(_GLIBCXX_USE_CXX11_ABI=0)
|
||||
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -O0 -g -std=c++17 -Werror -Wall -fPIE -Wl,--allow-shlib-undefined")
|
||||
set(PROJECT_SRC_ROOT ${CMAKE_CURRENT_LIST_DIR}/)
|
||||
option(MINDSPORE_PATH "mindspore install path" "")
|
||||
include_directories(${MINDSPORE_PATH})
|
||||
include_directories(${MINDSPORE_PATH}/include)
|
||||
include_directories(${PROJECT_SRC_ROOT})
|
||||
find_library(MS_LIB libmindspore.so ${MINDSPORE_PATH}/lib)
|
||||
file(GLOB_RECURSE MD_LIB ${MINDSPORE_PATH}/_c_dataengine*)
|
||||
|
||||
add_executable(main src/main.cc src/utils.cc)
|
||||
target_link_libraries(main ${MS_LIB} ${MD_LIB} gflags)
|
|
@ -0,0 +1,29 @@
|
|||
#!/bin/bash
|
||||
# Copyright 2021 Huawei Technologies Co., Ltd
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
# ============================================================================
|
||||
if [ -d out ]; then
|
||||
rm -rf out
|
||||
fi
|
||||
|
||||
mkdir out
|
||||
cd out || exit
|
||||
|
||||
if [ -f "Makefile" ]; then
|
||||
make clean
|
||||
fi
|
||||
|
||||
cmake .. \
|
||||
-DMINDSPORE_PATH="`pip3.7 show mindspore-ascend | grep Location | awk '{print $2"/mindspore"}' | xargs realpath`"
|
||||
make
|
|
@ -0,0 +1 @@
|
|||
ConvBatchnormFusionPass:off
|
|
@ -1,62 +0,0 @@
|
|||
/*
|
||||
* Copyright (c) 2020.Huawei Technologies Co., Ltd. All rights reserved.
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef ACLMANAGER_H
|
||||
#define ACLMANAGER_H
|
||||
|
||||
#include <map>
|
||||
#include <iostream>
|
||||
#include <string>
|
||||
#include <memory>
|
||||
#include <vector>
|
||||
#include "acl/acl.h"
|
||||
#include "CommonDataType.h"
|
||||
#include "ModelProcess.h"
|
||||
#include "DvppCommon.h"
|
||||
|
||||
struct ModelInfo {
|
||||
std::string modelPath;
|
||||
uint32_t modelWidth;
|
||||
uint32_t modelHeight;
|
||||
uint32_t outputNum;
|
||||
};
|
||||
|
||||
class AclProcess {
|
||||
public:
|
||||
AclProcess(int deviceId, const std::string &om_path, uint32_t width, uint32_t height);
|
||||
~AclProcess() {}
|
||||
void Release();
|
||||
int InitResource();
|
||||
int Process(const std::string& imageFile, std::map<double, double> *costTime_map);
|
||||
|
||||
private:
|
||||
int InitModule();
|
||||
int Preprocess(const std::string& imageFile);
|
||||
int ModelInfer(std::map<double, double> *costTime_map);
|
||||
int WriteResult(const std::string& imageFile);
|
||||
int ReadFile(const std::string &filePath, RawData *fileData);
|
||||
|
||||
int32_t deviceId_;
|
||||
ModelInfo modelInfo_;
|
||||
aclrtContext context_;
|
||||
aclrtStream stream_;
|
||||
std::shared_ptr<ModelProcess> modelProcess_;
|
||||
std::shared_ptr<DvppCommon> dvppCommon_;
|
||||
bool keepRatio_;
|
||||
std::vector<void *> outputBuffers_;
|
||||
std::vector<size_t> outputSizes_;
|
||||
};
|
||||
|
||||
#endif
|
|
@ -1,95 +0,0 @@
|
|||
/*
|
||||
* Copyright (c) 2020.Huawei Technologies Co., Ltd. All rights reserved.
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef COMMONDATATYPE_H
|
||||
#define COMMONDATATYPE_H
|
||||
|
||||
#include <stdio.h>
|
||||
#include <iostream>
|
||||
#include <memory>
|
||||
#include <vector>
|
||||
#include "acl/acl.h"
|
||||
#include "acl/ops/acl_dvpp.h"
|
||||
|
||||
#define DVPP_ALIGN_UP(x, align) ((((x) + ((align)-1)) / (align)) * (align))
|
||||
|
||||
#define OK 0
|
||||
#define ERROR -1
|
||||
#define INVALID_POINTER -2
|
||||
#define READ_FILE_FAIL -3
|
||||
#define OPEN_FILE_FAIL -4
|
||||
#define INIT_FAIL -5
|
||||
#define INVALID_PARAM -6
|
||||
#define DECODE_FAIL -7
|
||||
|
||||
const float SEC2MS = 1000.0;
|
||||
const int YUV_BGR_SIZE_CONVERT_3 = 3;
|
||||
const int YUV_BGR_SIZE_CONVERT_2 = 2;
|
||||
const int VPC_WIDTH_ALIGN = 16;
|
||||
const int VPC_HEIGHT_ALIGN = 2;
|
||||
|
||||
// Description of image data
|
||||
struct ImageInfo {
|
||||
uint32_t width; // Image width
|
||||
uint32_t height; // Image height
|
||||
uint32_t lenOfByte; // Size of image data, bytes
|
||||
std::shared_ptr<uint8_t> data; // Smart pointer of image data
|
||||
};
|
||||
|
||||
// Description of data in device
|
||||
struct RawData {
|
||||
size_t lenOfByte; // Size of memory, bytes
|
||||
std::shared_ptr<void> data; // Smart pointer of data
|
||||
};
|
||||
|
||||
// define the structure of an rectangle
|
||||
struct Rectangle {
|
||||
uint32_t leftTopX;
|
||||
uint32_t leftTopY;
|
||||
uint32_t rightBottomX;
|
||||
uint32_t rightBottomY;
|
||||
};
|
||||
|
||||
enum VpcProcessType {
|
||||
VPC_PT_DEFAULT = 0,
|
||||
VPC_PT_PADDING, // Resize with locked ratio and paste on upper left corner
|
||||
VPC_PT_FIT, // Resize with locked ratio and paste on middle location
|
||||
VPC_PT_FILL, // Resize with locked ratio and paste on whole locatin, the input image may be cropped
|
||||
};
|
||||
|
||||
struct DvppDataInfo {
|
||||
uint32_t width = 0; // Width of image
|
||||
uint32_t height = 0; // Height of image
|
||||
uint32_t widthStride = 0; // Width after align up
|
||||
uint32_t heightStride = 0; // Height after align up
|
||||
acldvppPixelFormat format = PIXEL_FORMAT_YUV_SEMIPLANAR_420; // Format of image
|
||||
uint32_t frameId = 0; // Needed by video
|
||||
uint32_t dataSize = 0; // Size of data in byte
|
||||
uint8_t *data = nullptr; // Image data
|
||||
};
|
||||
|
||||
struct CropRoiConfig {
|
||||
uint32_t left;
|
||||
uint32_t right;
|
||||
uint32_t down;
|
||||
uint32_t up;
|
||||
};
|
||||
|
||||
struct DvppCropInputInfo {
|
||||
DvppDataInfo dataInfo;
|
||||
CropRoiConfig roi;
|
||||
};
|
||||
|
||||
#endif
|
|
@ -1,139 +0,0 @@
|
|||
/*
|
||||
* Copyright (c) 2020.Huawei Technologies Co., Ltd. All rights reserved.
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef DVPP_COMMON_H
|
||||
#define DVPP_COMMON_H
|
||||
#include <memory>
|
||||
|
||||
#include "CommonDataType.h"
|
||||
#include "acl/ops/acl_dvpp.h"
|
||||
|
||||
const int MODULUS_NUM_2 = 2;
|
||||
const uint32_t ODD_NUM_1 = 1;
|
||||
|
||||
const uint32_t JPEGD_STRIDE_WIDTH = 128; // Jpegd module output width need to align up to 128
|
||||
const uint32_t JPEGD_STRIDE_HEIGHT = 16; // Jpegd module output height need to align up to 16
|
||||
const uint32_t VPC_STRIDE_WIDTH = 16; // Vpc module output width need to align up to 16
|
||||
const uint32_t VPC_STRIDE_HEIGHT = 2; // Vpc module output height need to align up to 2
|
||||
const uint32_t YUV422_WIDTH_NU = 2; // Width of YUV422, WidthStride = Width * 2
|
||||
const uint32_t YUV444_RGB_WIDTH_NU = 3; // Width of YUV444 and RGB888, WidthStride = Width * 3
|
||||
const uint32_t XRGB_WIDTH_NU = 4; // Width of XRGB8888, WidthStride = Width * 4
|
||||
const uint32_t JPEG_OFFSET = 8; // Offset of input file for jpegd module
|
||||
const uint32_t MAX_JPEGD_WIDTH = 8192; // Max width of jpegd module
|
||||
const uint32_t MAX_JPEGD_HEIGHT = 8192; // Max height of jpegd module
|
||||
const uint32_t MIN_JPEGD_WIDTH = 32; // Min width of jpegd module
|
||||
const uint32_t MIN_JPEGD_HEIGHT = 32; // Min height of jpegd module
|
||||
const uint32_t MAX_RESIZE_WIDTH = 4096; // Max width stride of resize module
|
||||
const uint32_t MAX_RESIZE_HEIGHT = 4096; // Max height stride of resize module
|
||||
const uint32_t MIN_RESIZE_WIDTH = 32; // Min width stride of resize module
|
||||
const uint32_t MIN_RESIZE_HEIGHT = 6; // Min height stride of resize module
|
||||
const float MIN_RESIZE_SCALE = 0.03125; // Min resize scale of resize module
|
||||
const float MAX_RESIZE_SCALE = 16.0; // Min resize scale of resize module
|
||||
const uint32_t MAX_VPC_WIDTH = 4096; // Max width of picture to VPC(resize/crop)
|
||||
const uint32_t MAX_VPC_HEIGHT = 4096; // Max height of picture to VPC(resize/crop)
|
||||
const uint32_t MIN_VPC_WIDTH = 32; // Min width of picture to VPC(resize/crop)
|
||||
const uint32_t MIN_VPC_HEIGHT = 6; // Min height of picture to VPC(resize/crop)
|
||||
const uint32_t MIN_CROP_WIDTH = 10; // Min width of crop area
|
||||
const uint32_t MIN_CROP_HEIGHT = 6; // Min height of crop area
|
||||
const uint8_t YUV_GREYER_VALUE = 128; // Filling value of the resized YUV image
|
||||
|
||||
#define CONVERT_TO_ODD(NUM) (((NUM) % MODULUS_NUM_2 != 0) ? (NUM) : ((NUM) - 1))
|
||||
#define CONVERT_TO_EVEN(NUM) (((NUM) % MODULUS_NUM_2 == 0) ? (NUM) : ((NUM) - 1))
|
||||
#define CHECK_ODD(num) ((num) % MODULUS_NUM_2 != 0)
|
||||
#define CHECK_EVEN(num) ((num) % MODULUS_NUM_2 == 0)
|
||||
#define RELEASE_DVPP_DATA(dvppDataPtr) do { \
|
||||
int retMacro; \
|
||||
if (dvppDataPtr != nullptr) { \
|
||||
retMacro = acldvppFree(dvppDataPtr); \
|
||||
if (retMacro != OK) { \
|
||||
std::cout << "Failed to free memory on dvpp, ret = " << retMacro << "." << std::endl; \
|
||||
} \
|
||||
dvppDataPtr = nullptr; \
|
||||
} \
|
||||
} while (0);
|
||||
|
||||
class DvppCommon {
|
||||
public:
|
||||
explicit DvppCommon(aclrtStream dvppStream);
|
||||
~DvppCommon();
|
||||
int Init(void);
|
||||
int DeInit(void);
|
||||
|
||||
static int GetVpcDataSize(uint32_t widthVpc, uint32_t heightVpc, acldvppPixelFormat format,
|
||||
uint32_t *vpcSize);
|
||||
|
||||
static int GetVpcInputStrideSize(uint32_t width, uint32_t height, acldvppPixelFormat format,
|
||||
uint32_t *widthStride, uint32_t *heightStride);
|
||||
|
||||
static int GetVpcOutputStrideSize(uint32_t width, uint32_t height, acldvppPixelFormat format,
|
||||
uint32_t *widthStride, uint32_t *heightStride);
|
||||
|
||||
static void GetJpegDecodeStrideSize(uint32_t width, uint32_t height, uint32_t *widthStride, uint32_t *heightStride);
|
||||
static int GetJpegImageInfo(const void *data, uint32_t dataSize, uint32_t *width, uint32_t *height,
|
||||
int32_t *components);
|
||||
|
||||
static int GetJpegDecodeDataSize(const void *data, uint32_t dataSize, acldvppPixelFormat format,
|
||||
uint32_t *decSize);
|
||||
|
||||
int VpcResize(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output, bool withSynchronize,
|
||||
VpcProcessType processType = VPC_PT_DEFAULT);
|
||||
|
||||
int JpegDecode(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output, bool withSynchronize);
|
||||
|
||||
int CombineResizeProcess(std::shared_ptr<DvppDataInfo> input, const DvppDataInfo &output, bool withSynchronize,
|
||||
VpcProcessType processType = VPC_PT_DEFAULT);
|
||||
|
||||
int CombineJpegdProcess(const RawData& imageInfo, acldvppPixelFormat format, bool withSynchronize);
|
||||
|
||||
std::shared_ptr<DvppDataInfo> GetInputImage();
|
||||
std::shared_ptr<DvppDataInfo> GetDecodedImage();
|
||||
std::shared_ptr<DvppDataInfo> GetResizedImage();
|
||||
|
||||
void ReleaseDvppBuffer();
|
||||
|
||||
private:
|
||||
int SetDvppPicDescData(std::shared_ptr<DvppDataInfo> dataInfo, std::shared_ptr<acldvppPicDesc>picDesc);
|
||||
int ResizeProcess(std::shared_ptr<acldvppPicDesc> inputDesc,
|
||||
std::shared_ptr<acldvppPicDesc> outputDesc, bool withSynchronize);
|
||||
|
||||
int ResizeWithPadding(std::shared_ptr<acldvppPicDesc> inputDesc, std::shared_ptr<acldvppPicDesc> outputDesc,
|
||||
const CropRoiConfig &cropRoi, const CropRoiConfig &pasteRoi, bool withSynchronize);
|
||||
|
||||
void GetCropRoi(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output,
|
||||
VpcProcessType processType, CropRoiConfig *cropRoi);
|
||||
|
||||
void GetPasteRoi(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output,
|
||||
VpcProcessType processType, CropRoiConfig *pasteRoi);
|
||||
|
||||
int CheckResizeParams(const DvppDataInfo &input, const DvppDataInfo &output);
|
||||
int TransferImageH2D(const RawData& imageInfo, const std::shared_ptr<DvppDataInfo>& jpegInput);
|
||||
int CreateStreamDesc(std::shared_ptr<DvppDataInfo> data);
|
||||
int DestroyResource();
|
||||
|
||||
std::shared_ptr<acldvppRoiConfig> cropAreaConfig_ = nullptr;
|
||||
std::shared_ptr<acldvppRoiConfig> pasteAreaConfig_ = nullptr;
|
||||
|
||||
std::shared_ptr<acldvppPicDesc> resizeInputDesc_ = nullptr;
|
||||
std::shared_ptr<acldvppPicDesc> resizeOutputDesc_ = nullptr;
|
||||
std::shared_ptr<acldvppPicDesc> decodeOutputDesc_ = nullptr;
|
||||
std::shared_ptr<acldvppResizeConfig> resizeConfig_ = nullptr;
|
||||
|
||||
acldvppChannelDesc *dvppChannelDesc_ = nullptr;
|
||||
aclrtStream dvppStream_ = nullptr;
|
||||
std::shared_ptr<DvppDataInfo> inputImage_ = nullptr;
|
||||
std::shared_ptr<DvppDataInfo> decodedImage_ = nullptr;
|
||||
std::shared_ptr<DvppDataInfo> resizedImage_ = nullptr;
|
||||
};
|
||||
#endif
|
|
@ -1,63 +0,0 @@
|
|||
/*
|
||||
* Copyright(C) 2020. Huawei Technologies Co.,Ltd. All rights reserved.
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef MODELPROCSS_H
|
||||
#define MODELPROCSS_H
|
||||
|
||||
#include <cstdio>
|
||||
#include <vector>
|
||||
#include <unordered_map>
|
||||
#include <mutex>
|
||||
#include <map>
|
||||
#include <memory>
|
||||
#include <string>
|
||||
#include "acl/acl.h"
|
||||
#include "CommonDataType.h"
|
||||
|
||||
class ModelProcess {
|
||||
public:
|
||||
explicit ModelProcess(const int deviceId);
|
||||
ModelProcess();
|
||||
~ModelProcess();
|
||||
|
||||
int Init(const std::string &modelPath);
|
||||
int DeInit();
|
||||
|
||||
int ModelInference(const std::vector<void *> &inputBufs,
|
||||
const std::vector<size_t> &inputSizes,
|
||||
const std::vector<void *> &ouputBufs,
|
||||
const std::vector<size_t> &outputSizes,
|
||||
std::map<double, double> *costTime_map);
|
||||
aclmdlDesc *GetModelDesc();
|
||||
int ReadBinaryFile(const std::string &fileName, uint8_t **buffShared, int *buffLength);
|
||||
|
||||
private:
|
||||
aclmdlDataset *CreateAndFillDataset(const std::vector<void *> &bufs, const std::vector<size_t> &sizes);
|
||||
void DestroyDataset(aclmdlDataset *dataset);
|
||||
|
||||
std::mutex mtx_ = {};
|
||||
int deviceId_ = 0;
|
||||
uint32_t modelId_ = 0;
|
||||
void *modelDevPtr_ = nullptr;
|
||||
size_t modelDevPtrSize_ = 0;
|
||||
void *weightDevPtr_ = nullptr;
|
||||
size_t weightDevPtrSize_ = 0;
|
||||
aclrtContext contextModel_ = nullptr;
|
||||
std::shared_ptr<aclmdlDesc> modelDesc_ = nullptr;
|
||||
bool isDeInit_ = false;
|
||||
};
|
||||
|
||||
#endif
|
|
@ -0,0 +1,32 @@
|
|||
/**
|
||||
* Copyright 2021 Huawei Technologies Co., Ltd
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef MINDSPORE_INFERENCE_UTILS_H_
|
||||
#define MINDSPORE_INFERENCE_UTILS_H_
|
||||
|
||||
#include <sys/stat.h>
|
||||
#include <dirent.h>
|
||||
#include <vector>
|
||||
#include <string>
|
||||
#include <memory>
|
||||
#include "include/api/types.h"
|
||||
|
||||
std::vector<std::string> GetAllFiles(std::string_view dirName);
|
||||
DIR *OpenDir(std::string_view dirName);
|
||||
std::string RealPath(std::string_view path);
|
||||
mindspore::MSTensor ReadFileToTensor(const std::string &file);
|
||||
int WriteResult(const std::string& imageFile, const std::vector<mindspore::MSTensor> &outputs);
|
||||
#endif
|
|
@ -1,371 +0,0 @@
|
|||
/*
|
||||
* Copyright (c) 2020.Huawei Technologies Co., Ltd. All rights reserved.
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include "AclProcess.h"
|
||||
#include <sys/time.h>
|
||||
#include <thread>
|
||||
#include <string>
|
||||
|
||||
/*
|
||||
* @description Implementation of constructor for class AclProcess with parameter list
|
||||
* @attention context is passed in as a parameter after being created in ResourceManager::InitResource
|
||||
*/
|
||||
AclProcess::AclProcess(int deviceId, const std::string &om_path, uint32_t width, uint32_t height)
|
||||
: deviceId_(deviceId), stream_(nullptr), modelProcess_(nullptr), dvppCommon_(nullptr), keepRatio_(true) {
|
||||
modelInfo_.modelPath = om_path;
|
||||
modelInfo_.modelWidth = width;
|
||||
modelInfo_.modelHeight = height;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description Release all the resource
|
||||
* @attention context will be released in ResourceManager::Release
|
||||
*/
|
||||
void AclProcess::Release() {
|
||||
// Synchronize stream and release Dvpp channel
|
||||
dvppCommon_->DeInit();
|
||||
// Release stream
|
||||
if (stream_ != nullptr) {
|
||||
int ret = aclrtDestroyStream(stream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to destroy the stream, ret = " << ret << ".";
|
||||
}
|
||||
stream_ = nullptr;
|
||||
}
|
||||
// Destroy resources of modelProcess_
|
||||
modelProcess_->DeInit();
|
||||
|
||||
// Release Dvpp buffer
|
||||
dvppCommon_->ReleaseDvppBuffer();
|
||||
|
||||
return;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description Initialize the modules used by this sample
|
||||
* @return int int code
|
||||
*/
|
||||
int AclProcess::InitModule() {
|
||||
// Create Dvpp common object
|
||||
if (dvppCommon_ == nullptr) {
|
||||
dvppCommon_ = std::make_shared<DvppCommon>(stream_);
|
||||
int retDvppCommon = dvppCommon_->Init();
|
||||
if (retDvppCommon != OK) {
|
||||
std::cout << "Failed to initialize dvppCommon, ret = " << retDvppCommon << std::endl;
|
||||
return retDvppCommon;
|
||||
}
|
||||
}
|
||||
// Create model inference object
|
||||
if (modelProcess_ == nullptr) {
|
||||
modelProcess_ = std::make_shared<ModelProcess>(deviceId_);
|
||||
}
|
||||
// Initialize ModelProcess module
|
||||
int ret = modelProcess_->Init(modelInfo_.modelPath);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to initialize the model process module, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
std::cout << "Initialized the model process module successfully." << std::endl;
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description Create resource for this sample
|
||||
* @return int int code
|
||||
*/
|
||||
int AclProcess::InitResource() {
|
||||
int ret = aclInit(nullptr); // Initialize ACL
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to init acl, ret = " << ret << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = aclrtSetDevice(deviceId_);
|
||||
if (ret != ACL_SUCCESS) {
|
||||
std::cout << "acl set device " << deviceId_ << "intCode = "<< static_cast<int32_t>(ret) << std::endl;
|
||||
return ret;
|
||||
}
|
||||
std::cout << "set device "<< deviceId_ << " success" << std::endl;
|
||||
|
||||
// create context (set current)
|
||||
ret = aclrtCreateContext(&context_, deviceId_);
|
||||
if (ret != ACL_SUCCESS) {
|
||||
std::cout << "acl create context failed, deviceId = " << deviceId_ <<
|
||||
"intCode = "<< static_cast<int32_t>(ret) << std::endl;
|
||||
return ret;
|
||||
}
|
||||
std::cout << "create context success" << std::endl;
|
||||
|
||||
ret = aclrtCreateStream(&stream_); // Create stream for application
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to create the acl stream, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
std::cout << "Created the acl stream successfully." << std::endl;
|
||||
// Initialize dvpp module
|
||||
if (InitModule() != OK) {
|
||||
return INIT_FAIL;
|
||||
}
|
||||
|
||||
aclmdlDesc *modelDesc = modelProcess_->GetModelDesc();
|
||||
size_t outputSize = aclmdlGetNumOutputs(modelDesc);
|
||||
modelInfo_.outputNum = outputSize;
|
||||
for (size_t i = 0; i < outputSize; i++) {
|
||||
size_t bufferSize = aclmdlGetOutputSizeByIndex(modelDesc, i);
|
||||
void *outputBuffer = nullptr;
|
||||
ret = aclrtMalloc(&outputBuffer, bufferSize, ACL_MEM_MALLOC_NORMAL_ONLY);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to malloc buffer, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
outputBuffers_.push_back(outputBuffer);
|
||||
outputSizes_.push_back(bufferSize);
|
||||
}
|
||||
|
||||
return OK;
|
||||
}
|
||||
|
||||
int AclProcess::WriteResult(const std::string& imageFile) {
|
||||
std::string homePath = "./result_Files";
|
||||
void *resHostBuf = nullptr;
|
||||
for (size_t i = 0; i < outputBuffers_.size(); ++i) {
|
||||
size_t output_size;
|
||||
void *netOutput;
|
||||
netOutput = outputBuffers_[i];
|
||||
output_size = outputSizes_[i];
|
||||
int ret = aclrtMallocHost(&resHostBuf, output_size);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to print the result, malloc host failed, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = aclrtMemcpy(resHostBuf, output_size, netOutput,
|
||||
output_size, ACL_MEMCPY_DEVICE_TO_HOST);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to print result, memcpy device to host failed, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
int pos = imageFile.rfind('/');
|
||||
std::string fileName(imageFile, pos + 1);
|
||||
fileName.replace(fileName.find('.'), fileName.size() - fileName.find('.'), "_" + std::to_string(i) + ".bin");
|
||||
|
||||
std::string outFileName = homePath + "/" + fileName;
|
||||
try {
|
||||
FILE *outputFile = fopen(outFileName.c_str(), "wb");
|
||||
if (outputFile == nullptr) {
|
||||
std::cout << "open result file " << outFileName << " failed" << std::endl;
|
||||
return INVALID_POINTER;
|
||||
}
|
||||
size_t size = fwrite(resHostBuf, sizeof(char), output_size, outputFile);
|
||||
if (size != output_size) {
|
||||
fclose(outputFile);
|
||||
outputFile = nullptr;
|
||||
std::cout << "write result file " << outFileName << " failed, write size[" << size <<
|
||||
"] is smaller than output size[" << output_size << "], maybe the disk is full." << std::endl;
|
||||
return ERROR;
|
||||
}
|
||||
fclose(outputFile);
|
||||
outputFile = nullptr;
|
||||
} catch (std::exception &e) {
|
||||
std::cout << "write result file " << outFileName << " failed, error info: " << e.what() << std::endl;
|
||||
std::exit(1);
|
||||
}
|
||||
|
||||
ret = aclrtFreeHost(resHostBuf);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtFree host output memory failed" << std::endl;
|
||||
return ret;
|
||||
}
|
||||
}
|
||||
return OK;
|
||||
}
|
||||
|
||||
/**
|
||||
* Read a file, store it into the RawData structure
|
||||
*
|
||||
* @param filePath file to read to
|
||||
* @param fileData RawData structure to store in
|
||||
* @return OK if create success, int code otherwise
|
||||
*/
|
||||
int AclProcess::ReadFile(const std::string &filePath, RawData *fileData) {
|
||||
// Open file with reading mode
|
||||
FILE *fp = fopen(filePath.c_str(), "rb");
|
||||
if (fp == nullptr) {
|
||||
std::cout << "Failed to open file, filePath = " << filePath << std::endl;
|
||||
return OPEN_FILE_FAIL;
|
||||
}
|
||||
// Get the length of input file
|
||||
fseek(fp, 0, SEEK_END);
|
||||
size_t fileSize = ftell(fp);
|
||||
fseek(fp, 0, SEEK_SET);
|
||||
// If file not empty, read it into FileInfo and return it
|
||||
if (fileSize > 0) {
|
||||
fileData->lenOfByte = fileSize;
|
||||
fileData->data = std::make_shared<uint8_t>();
|
||||
fileData->data.reset(new uint8_t[fileSize], std::default_delete<uint8_t[]>());
|
||||
uint32_t readRet = fread(fileData->data.get(), 1, fileSize, fp);
|
||||
if (readRet == 0) {
|
||||
fclose(fp);
|
||||
return READ_FILE_FAIL;
|
||||
}
|
||||
fclose(fp);
|
||||
return OK;
|
||||
}
|
||||
fclose(fp);
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
/*
|
||||
* @description Preprocess the input image
|
||||
* @param imageFile input image path
|
||||
* @return int int code
|
||||
*/
|
||||
int AclProcess::Preprocess(const std::string& imageFile) {
|
||||
RawData imageInfo;
|
||||
int ret = ReadFile(imageFile, &imageInfo); // Read image data from input image file
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to read file, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
// Run process of jpegD
|
||||
ret = dvppCommon_->CombineJpegdProcess(imageInfo, PIXEL_FORMAT_YUV_SEMIPLANAR_420, true);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to execute image decoded of preprocess module, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
// Get output of decode jpeg image
|
||||
std::shared_ptr<DvppDataInfo> decodeOutData = dvppCommon_->GetDecodedImage();
|
||||
// Run resize application function
|
||||
DvppDataInfo resizeOutData;
|
||||
resizeOutData.height = modelInfo_.modelHeight;
|
||||
resizeOutData.width = modelInfo_.modelWidth;
|
||||
resizeOutData.format = PIXEL_FORMAT_YUV_SEMIPLANAR_420;
|
||||
ret = dvppCommon_->CombineResizeProcess(decodeOutData, resizeOutData, true, VPC_PT_PADDING);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to execute image resized of preprocess module, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
RELEASE_DVPP_DATA(decodeOutData->data);
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description Inference of model
|
||||
* @return int int code
|
||||
*/
|
||||
int AclProcess::ModelInfer(std::map<double, double> *costTime_map) {
|
||||
// Get output of resize module
|
||||
std::shared_ptr<DvppDataInfo> resizeOutData = dvppCommon_->GetResizedImage();
|
||||
std::shared_ptr<DvppDataInfo> inputImg = dvppCommon_->GetInputImage();
|
||||
|
||||
float widthScale, heightScale;
|
||||
if (keepRatio_) {
|
||||
widthScale = static_cast<float>(resizeOutData->width) / inputImg->width;
|
||||
if (widthScale > static_cast<float>(resizeOutData->height) / inputImg->height) {
|
||||
widthScale = static_cast<float>(resizeOutData->height) / inputImg->height;
|
||||
}
|
||||
heightScale = widthScale;
|
||||
} else {
|
||||
widthScale = static_cast<float>(resizeOutData->width) / inputImg->width;
|
||||
heightScale = static_cast<float>(resizeOutData->height) / inputImg->height;
|
||||
}
|
||||
|
||||
aclFloat16 inputWidth = aclFloatToFloat16(static_cast<float>(inputImg->width));
|
||||
aclFloat16 inputHeight = aclFloatToFloat16(static_cast<float>(inputImg->height));
|
||||
aclFloat16 resizeWidthRatioFp16 = aclFloatToFloat16(widthScale);
|
||||
aclFloat16 resizeHeightRatioFp16 = aclFloatToFloat16(heightScale);
|
||||
|
||||
aclFloat16 *im_info = reinterpret_cast<aclFloat16 *>(malloc(sizeof(aclFloat16) * 4));
|
||||
im_info[0] = inputHeight;
|
||||
im_info[1] = inputWidth;
|
||||
im_info[2] = resizeHeightRatioFp16;
|
||||
im_info[3] = resizeWidthRatioFp16;
|
||||
void *imInfo_dst = nullptr;
|
||||
int ret = aclrtMalloc(&imInfo_dst, 8, ACL_MEM_MALLOC_NORMAL_ONLY);
|
||||
if (ret != ACL_ERROR_NONE) {
|
||||
std::cout << "aclrtMalloc failed, ret = " << ret << std::endl;
|
||||
aclrtFree(imInfo_dst);
|
||||
return ret;
|
||||
}
|
||||
ret = aclrtMemcpy(reinterpret_cast<uint8_t *>(imInfo_dst), 8, im_info, 8, ACL_MEMCPY_HOST_TO_DEVICE);
|
||||
if (ret != ACL_ERROR_NONE) {
|
||||
std::cout << "aclrtMemcpy failed, ret = " << ret << std::endl;
|
||||
aclrtFree(imInfo_dst);
|
||||
return ret;
|
||||
}
|
||||
|
||||
std::vector<void *> inputBuffers({resizeOutData->data, imInfo_dst});
|
||||
std::vector<size_t> inputSizes({resizeOutData->dataSize, 4 * 2});
|
||||
|
||||
for (size_t i = 0; i < modelInfo_.outputNum; i++) {
|
||||
aclrtMemset(outputBuffers_[i], outputSizes_[i], 0, outputSizes_[i]);
|
||||
}
|
||||
// Execute classification model
|
||||
ret = modelProcess_->ModelInference(inputBuffers, inputSizes, outputBuffers_, outputSizes_, costTime_map);
|
||||
if (ret != OK) {
|
||||
aclrtFree(imInfo_dst);
|
||||
std::cout << "Failed to execute the classification model, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = aclrtFree(imInfo_dst);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtFree image info failed" << std::endl;
|
||||
return ret;
|
||||
}
|
||||
RELEASE_DVPP_DATA(resizeOutData->data);
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description Process classification
|
||||
*
|
||||
* @par Function
|
||||
* 1.Dvpp module preprocess
|
||||
* 2.Execute classification model
|
||||
* 3.Execute single operator
|
||||
* 4.Write result
|
||||
*
|
||||
* @param imageFile input file path
|
||||
* @return int int code
|
||||
*/
|
||||
|
||||
int AclProcess::Process(const std::string& imageFile, std::map<double, double> *costTime_map) {
|
||||
struct timeval begin = {0};
|
||||
struct timeval end = {0};
|
||||
gettimeofday(&begin, nullptr);
|
||||
|
||||
int ret = Preprocess(imageFile);
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = ModelInfer(costTime_map);
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = WriteResult(imageFile);
|
||||
if (ret != OK) {
|
||||
std::cout << "write result failed." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
gettimeofday(&end, nullptr);
|
||||
|
||||
const double costMs = SEC2MS * (end.tv_sec - begin.tv_sec) + (end.tv_usec - begin.tv_usec) / SEC2MS;
|
||||
std::cout << "[Process Delay] cost: " << costMs << "ms." << std::endl;
|
||||
return OK;
|
||||
}
|
|
@ -1,42 +0,0 @@
|
|||
# Copyright (c) Huawei Technologies Co., Ltd. 2020. All rights reserved.
|
||||
|
||||
# CMake lowest version requirement
|
||||
cmake_minimum_required(VERSION 3.5.1)
|
||||
# Add definitions ENABLE_DVPP_INTERFACE to use dvpp api
|
||||
add_definitions(-DENABLE_DVPP_INTERFACE)
|
||||
# project information
|
||||
project(InferClassification)
|
||||
# Check environment variable
|
||||
if(NOT DEFINED ENV{ASCEND_HOME})
|
||||
message(FATAL_ERROR "please define environment variable:ASCEND_HOME")
|
||||
endif()
|
||||
|
||||
# Compile options
|
||||
add_compile_options(-std=c++11 -fPIE -g -fstack-protector-all -Werror -Wreturn-type)
|
||||
|
||||
# Skip build rpath
|
||||
set(CMAKE_SKIP_BUILD_RPATH True)
|
||||
|
||||
# Set output directory
|
||||
set(PROJECT_SRC_ROOT ${CMAKE_CURRENT_LIST_DIR}/)
|
||||
set(CMAKE_RUNTIME_OUTPUT_DIRECTORY ${PROJECT_SRC_ROOT}/out)
|
||||
|
||||
# Set include directory and library directory
|
||||
set(ACL_LIB_DIR $ENV{ASCEND_HOME}/acllib)
|
||||
set(ATLAS_ACL_LIB_DIR $ENV{ASCEND_HOME}/ascend-toolkit/latest/acllib)
|
||||
# Header path
|
||||
include_directories(${ACL_LIB_DIR}/include/)
|
||||
include_directories(${ATLAS_ACL_LIB_DIR}/include/)
|
||||
include_directories(${PROJECT_SRC_ROOT}/../inc)
|
||||
|
||||
# add host lib path
|
||||
link_directories(${ACL_LIB_DIR})
|
||||
find_library(acl libascendcl.so ${ACL_LIB_DIR}/lib64 ${ATLAS_ACL_LIB_DIR}/lib64)
|
||||
find_library(acl_dvpp libacl_dvpp.so ${ACL_LIB_DIR}/lib64 ${ATLAS_ACL_LIB_DIR}/lib64)
|
||||
|
||||
add_executable(main AclProcess.cpp
|
||||
DvppCommon.cpp
|
||||
ModelProcess.cpp
|
||||
main.cpp)
|
||||
|
||||
target_link_libraries(main ${acl} gflags ${acl_dvpp} pthread)
|
|
@ -1,735 +0,0 @@
|
|||
/*
|
||||
* Copyright (c) 2020.Huawei Technologies Co., Ltd. All rights reserved.
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include <iostream>
|
||||
#include <memory>
|
||||
|
||||
#include "../inc/DvppCommon.h"
|
||||
#include "../inc/CommonDataType.h"
|
||||
|
||||
static auto g_resizeConfigDeleter = [](acldvppResizeConfig *p) { acldvppDestroyResizeConfig(p); };
|
||||
static auto g_picDescDeleter = [](acldvppPicDesc *picDesc) { acldvppDestroyPicDesc(picDesc); };
|
||||
static auto g_roiConfigDeleter = [](acldvppRoiConfig *p) { acldvppDestroyRoiConfig(p); };
|
||||
|
||||
DvppCommon::DvppCommon(aclrtStream dvppStream):dvppStream_(dvppStream) {}
|
||||
|
||||
/*
|
||||
* @description: Create a channel for processing image data,
|
||||
* the channel description is created by acldvppCreateChannelDesc
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::Init(void) {
|
||||
dvppChannelDesc_ = acldvppCreateChannelDesc();
|
||||
if (dvppChannelDesc_ == nullptr) {
|
||||
return -1;
|
||||
}
|
||||
int ret = acldvppCreateChannel(dvppChannelDesc_);
|
||||
if (ret != 0) {
|
||||
std::cout << "Failed to create dvpp channel, ret = " << ret << "." << std::endl;
|
||||
acldvppDestroyChannelDesc(dvppChannelDesc_);
|
||||
dvppChannelDesc_ = nullptr;
|
||||
return ret;
|
||||
}
|
||||
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: destroy the channel and the channel description used by image.
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::DeInit(void) {
|
||||
int ret = aclrtSynchronizeStream(dvppStream_); // int ret
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to synchronize stream, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = acldvppDestroyChannel(dvppChannelDesc_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to destroy dvpp channel, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = acldvppDestroyChannelDesc(dvppChannelDesc_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to destroy dvpp channel description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Release the memory that is allocated in the interfaces which are started with "Combine"
|
||||
*/
|
||||
void DvppCommon::ReleaseDvppBuffer() {
|
||||
if (resizedImage_ != nullptr) {
|
||||
RELEASE_DVPP_DATA(resizedImage_->data);
|
||||
}
|
||||
if (decodedImage_ != nullptr) {
|
||||
RELEASE_DVPP_DATA(decodedImage_->data);
|
||||
}
|
||||
if (inputImage_ != nullptr) {
|
||||
RELEASE_DVPP_DATA(inputImage_->data);
|
||||
}
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get the size of buffer used to save image for VPC according to width, height and format
|
||||
* @param width specifies the width of the output image
|
||||
* @param height specifies the height of the output image
|
||||
* @param format specifies the format of the output image
|
||||
* @param: vpcSize is used to save the result size
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::GetVpcDataSize(uint32_t width, uint32_t height, acldvppPixelFormat format, uint32_t *vpcSize) {
|
||||
if (format != PIXEL_FORMAT_YUV_SEMIPLANAR_420 && format != PIXEL_FORMAT_YVU_SEMIPLANAR_420) {
|
||||
std::cout << "Format[" << format << "] for VPC is not supported, just support NV12 or NV21." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
uint32_t widthStride = DVPP_ALIGN_UP(width, VPC_WIDTH_ALIGN);
|
||||
uint32_t heightStride = DVPP_ALIGN_UP(height, VPC_HEIGHT_ALIGN);
|
||||
*vpcSize = widthStride * heightStride * YUV_BGR_SIZE_CONVERT_3 / YUV_BGR_SIZE_CONVERT_2;
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get the aligned width and height of the input image according to the image format
|
||||
* @param: width specifies the width before alignment
|
||||
* @param: height specifies the height before alignment
|
||||
* @param: format specifies the image format
|
||||
* @param: widthStride is used to save the width after alignment
|
||||
* @param: heightStride is used to save the height after alignment
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::GetVpcInputStrideSize(uint32_t width, uint32_t height, acldvppPixelFormat format,
|
||||
uint32_t *widthStride, uint32_t *heightStride) {
|
||||
uint32_t inputWidthStride;
|
||||
if (format >= PIXEL_FORMAT_YUV_400 && format <= PIXEL_FORMAT_YVU_SEMIPLANAR_444) {
|
||||
inputWidthStride = DVPP_ALIGN_UP(width, VPC_STRIDE_WIDTH);
|
||||
} else if (format >= PIXEL_FORMAT_YUYV_PACKED_422 && format <= PIXEL_FORMAT_VYUY_PACKED_422) {
|
||||
inputWidthStride = DVPP_ALIGN_UP(width, VPC_STRIDE_WIDTH) * YUV422_WIDTH_NU;
|
||||
} else if (format >= PIXEL_FORMAT_YUV_PACKED_444 && format <= PIXEL_FORMAT_BGR_888) {
|
||||
inputWidthStride = DVPP_ALIGN_UP(width, VPC_STRIDE_WIDTH) * YUV444_RGB_WIDTH_NU;
|
||||
} else if (format >= PIXEL_FORMAT_ARGB_8888 && format <= PIXEL_FORMAT_BGRA_8888) {
|
||||
inputWidthStride = DVPP_ALIGN_UP(width, VPC_STRIDE_WIDTH) * XRGB_WIDTH_NU;
|
||||
} else {
|
||||
std::cout << "Input format[" << format << "] for VPC is invalid, please check it." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
uint32_t inputHeightStride = DVPP_ALIGN_UP(height, VPC_STRIDE_HEIGHT);
|
||||
if (inputWidthStride > MAX_RESIZE_WIDTH || inputWidthStride < MIN_RESIZE_WIDTH) {
|
||||
std::cout << "Input width stride " << inputWidthStride << " is invalid, not in [" << MIN_RESIZE_WIDTH \
|
||||
<< ", " << MAX_RESIZE_WIDTH << "]." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
|
||||
if (inputHeightStride > MAX_RESIZE_HEIGHT || inputHeightStride < MIN_RESIZE_HEIGHT) {
|
||||
std::cout << "Input height stride " << inputHeightStride << " is invalid, not in [" << MIN_RESIZE_HEIGHT \
|
||||
<< ", " << MAX_RESIZE_HEIGHT << "]." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
*widthStride = inputWidthStride;
|
||||
*heightStride = inputHeightStride;
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get the aligned width and height of the output image according to the image format
|
||||
* @param: width specifies the width before alignment
|
||||
* @param: height specifies the height before alignment
|
||||
* @param: format specifies the image format
|
||||
* @param: widthStride is used to save the width after alignment
|
||||
* @param: heightStride is used to save the height after alignment
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::GetVpcOutputStrideSize(uint32_t width, uint32_t height, acldvppPixelFormat format,
|
||||
uint32_t *widthStride, uint32_t *heightStride) {
|
||||
if (format != PIXEL_FORMAT_YUV_SEMIPLANAR_420 && format != PIXEL_FORMAT_YVU_SEMIPLANAR_420) {
|
||||
std::cout << "Output format[" << format << "] is not supported, just support NV12 or NV21." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
|
||||
*widthStride = DVPP_ALIGN_UP(width, VPC_STRIDE_WIDTH);
|
||||
*heightStride = DVPP_ALIGN_UP(height, VPC_STRIDE_HEIGHT);
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Set picture description information and execute resize function
|
||||
* @param: input specifies the input image information
|
||||
* @param: output specifies the output image information
|
||||
* @param: withSynchronize specifies whether to execute synchronously
|
||||
* @param: processType specifies whether to perform proportional scaling, default is non-proportional resize
|
||||
* @return: OK if success, other values if failure
|
||||
* @attention: This function can be called only when the DvppCommon object is initialized with Init
|
||||
*/
|
||||
int DvppCommon::VpcResize(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output,
|
||||
bool withSynchronize, VpcProcessType processType) {
|
||||
acldvppPicDesc *inputDesc = acldvppCreatePicDesc();
|
||||
acldvppPicDesc *outputDesc = acldvppCreatePicDesc();
|
||||
resizeInputDesc_.reset(inputDesc, g_picDescDeleter);
|
||||
resizeOutputDesc_.reset(outputDesc, g_picDescDeleter);
|
||||
|
||||
// Set dvpp picture descriptin info of input image
|
||||
int ret = SetDvppPicDescData(input, resizeInputDesc_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set dvpp input picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
// Set dvpp picture descriptin info of output image
|
||||
ret = SetDvppPicDescData(output, resizeOutputDesc_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set dvpp output picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
if (processType == VPC_PT_DEFAULT) {
|
||||
return ResizeProcess(resizeInputDesc_, resizeOutputDesc_, withSynchronize);
|
||||
}
|
||||
|
||||
// Get crop area according to the processType
|
||||
CropRoiConfig cropRoi = {0};
|
||||
GetCropRoi(input, output, processType, &cropRoi);
|
||||
|
||||
// The width and height of the original image will be resized by the same ratio
|
||||
CropRoiConfig pasteRoi = {0};
|
||||
GetPasteRoi(input, output, processType, &pasteRoi);
|
||||
|
||||
return ResizeWithPadding(resizeInputDesc_, resizeOutputDesc_, cropRoi, pasteRoi, withSynchronize);
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Set image description information
|
||||
* @param: dataInfo specifies the image information
|
||||
* @param: picsDesc specifies the picture description information to be set
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::SetDvppPicDescData(std::shared_ptr<DvppDataInfo> dataInfo, std::shared_ptr<acldvppPicDesc>picDesc) {
|
||||
int ret = acldvppSetPicDescData(picDesc.get(), dataInfo->data);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set data for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = acldvppSetPicDescSize(picDesc.get(), dataInfo->dataSize);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set size for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = acldvppSetPicDescFormat(picDesc.get(), dataInfo->format);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set format for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = acldvppSetPicDescWidth(picDesc.get(), dataInfo->width);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set width for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = acldvppSetPicDescHeight(picDesc.get(), dataInfo->height);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set height for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = acldvppSetPicDescWidthStride(picDesc.get(), dataInfo->widthStride);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set aligned width for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = acldvppSetPicDescHeightStride(picDesc.get(), dataInfo->heightStride);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to set aligned height for dvpp picture description, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Check whether the image format and zoom ratio meet the requirements
|
||||
* @param: input specifies the input image information
|
||||
* @param: output specifies the output image information
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::CheckResizeParams(const DvppDataInfo &input, const DvppDataInfo &output) {
|
||||
if (output.format != PIXEL_FORMAT_YUV_SEMIPLANAR_420 && output.format != PIXEL_FORMAT_YVU_SEMIPLANAR_420) {
|
||||
std::cout << "Output format[" << output.format << "]is not supported, just support NV12 or NV21." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
float heightScale = static_cast<float>(output.height) / input.height;
|
||||
if (heightScale < MIN_RESIZE_SCALE || heightScale > MAX_RESIZE_SCALE) {
|
||||
std::cout << "Resize scale should be in range [1/16, 32], which is " << heightScale << "." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
float widthScale = static_cast<float>(output.width) / input.width;
|
||||
if (widthScale < MIN_RESIZE_SCALE || widthScale > MAX_RESIZE_SCALE) {
|
||||
std::cout << "Resize scale should be in range [1/16, 32], which is " << widthScale << "." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Scale the input image to the size specified by the output image and
|
||||
* saves the result to the output image (non-proportionate scaling)
|
||||
* @param: inputDesc specifies the description information of the input image
|
||||
* @param: outputDesc specifies the description information of the output image
|
||||
* @param: withSynchronize specifies whether to execute synchronously
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::ResizeProcess(std::shared_ptr<acldvppPicDesc>inputDesc,
|
||||
std::shared_ptr<acldvppPicDesc>outputDesc,
|
||||
bool withSynchronize) {
|
||||
acldvppResizeConfig *resizeConfig = acldvppCreateResizeConfig();
|
||||
if (resizeConfig == nullptr) {
|
||||
std::cout << "Failed to create dvpp resize config." << std::endl;
|
||||
return INVALID_POINTER;
|
||||
}
|
||||
|
||||
resizeConfig_.reset(resizeConfig, g_resizeConfigDeleter);
|
||||
int ret = acldvppVpcResizeAsync(dvppChannelDesc_, inputDesc.get(), outputDesc.get(),
|
||||
resizeConfig_.get(), dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to resize asynchronously, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
if (withSynchronize) {
|
||||
ret = aclrtSynchronizeStream(dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to synchronize stream, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
}
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Crop the image from the input image based on the specified area and
|
||||
* paste the cropped image to the specified position of the target image
|
||||
* as the output image
|
||||
* @param: inputDesc specifies the description information of the input image
|
||||
* @param: outputDesc specifies the description information of the output image
|
||||
* @param: cropRoi specifies the cropped area
|
||||
* @param: pasteRoi specifies the pasting area
|
||||
* @param: withSynchronize specifies whether to execute synchronously
|
||||
* @return: OK if success, other values if failure
|
||||
* @attention: If the width and height of the crop area are different from those of the
|
||||
* paste area, the image is scaled again
|
||||
*/
|
||||
int DvppCommon::ResizeWithPadding(std::shared_ptr<acldvppPicDesc> inputDesc,
|
||||
std::shared_ptr<acldvppPicDesc> outputDesc,
|
||||
const CropRoiConfig &cropRoi, const CropRoiConfig &pasteRoi, bool withSynchronize) {
|
||||
acldvppRoiConfig *cropRoiCfg = acldvppCreateRoiConfig(cropRoi.left, cropRoi.right, cropRoi.up, cropRoi.down);
|
||||
if (cropRoiCfg == nullptr) {
|
||||
std::cout << "Failed to create dvpp roi config for corp area." << std::endl;
|
||||
return INVALID_POINTER;
|
||||
}
|
||||
cropAreaConfig_.reset(cropRoiCfg, g_roiConfigDeleter);
|
||||
|
||||
acldvppRoiConfig *pastRoiCfg = acldvppCreateRoiConfig(pasteRoi.left, pasteRoi.right, pasteRoi.up, pasteRoi.down);
|
||||
if (pastRoiCfg == nullptr) {
|
||||
std::cout << "Failed to create dvpp roi config for paster area." << std::endl;
|
||||
return INVALID_POINTER;
|
||||
}
|
||||
pasteAreaConfig_.reset(pastRoiCfg, g_roiConfigDeleter);
|
||||
|
||||
int ret = acldvppVpcCropAndPasteAsync(dvppChannelDesc_, inputDesc.get(), outputDesc.get(), cropAreaConfig_.get(),
|
||||
pasteAreaConfig_.get(), dvppStream_);
|
||||
if (ret != OK) {
|
||||
// release resource.
|
||||
std::cout << "Failed to crop and paste asynchronously, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
if (withSynchronize) {
|
||||
ret = aclrtSynchronizeStream(dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed tp synchronize stream, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
}
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get crop area
|
||||
* @param: input specifies the input image information
|
||||
* @param: output specifies the output image information
|
||||
* @param: processType specifies whether to perform proportional scaling
|
||||
* @param: cropRoi is used to save the info of the crop roi area
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
void DvppCommon::GetCropRoi(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output,
|
||||
VpcProcessType processType, CropRoiConfig *cropRoi) {
|
||||
// When processType is not VPC_PT_FILL, crop area is the whole input image
|
||||
if (processType != VPC_PT_FILL) {
|
||||
cropRoi->right = CONVERT_TO_ODD(input->width - ODD_NUM_1);
|
||||
cropRoi->down = CONVERT_TO_ODD(input->height - ODD_NUM_1);
|
||||
return;
|
||||
}
|
||||
|
||||
bool widthRatioSmaller = true;
|
||||
// The scaling ratio is based on the smaller ratio to ensure the smallest edge to fill the targe edge
|
||||
float resizeRatio = static_cast<float>(input->width) / output->width;
|
||||
if (resizeRatio > (static_cast<float>(input->height) / output->height)) {
|
||||
resizeRatio = static_cast<float>(input->height) / output->height;
|
||||
widthRatioSmaller = false;
|
||||
}
|
||||
|
||||
const int halfValue = 2;
|
||||
// The left and up must be even, right and down must be odd which is required by acl
|
||||
if (widthRatioSmaller) {
|
||||
cropRoi->left = 0;
|
||||
cropRoi->right = CONVERT_TO_ODD(input->width - ODD_NUM_1);
|
||||
cropRoi->up = CONVERT_TO_EVEN(static_cast<uint32_t>((input->height - output->height * resizeRatio) /
|
||||
halfValue));
|
||||
cropRoi->down = CONVERT_TO_ODD(input->height - cropRoi->up - ODD_NUM_1);
|
||||
return;
|
||||
}
|
||||
|
||||
cropRoi->up = 0;
|
||||
cropRoi->down = CONVERT_TO_ODD(input->height - ODD_NUM_1);
|
||||
cropRoi->left = CONVERT_TO_EVEN(static_cast<uint32_t>((input->width - output->width * resizeRatio) / halfValue));
|
||||
cropRoi->right = CONVERT_TO_ODD(input->width - cropRoi->left - ODD_NUM_1);
|
||||
return;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get paste area
|
||||
* @param: input specifies the input image information
|
||||
* @param: output specifies the output image information
|
||||
* @param: processType specifies whether to perform proportional scaling
|
||||
* @param: pasteRio is used to save the info of the paste area
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
void DvppCommon::GetPasteRoi(std::shared_ptr<DvppDataInfo> input, std::shared_ptr<DvppDataInfo> output,
|
||||
VpcProcessType processType, CropRoiConfig *pasteRoi) {
|
||||
if (processType == VPC_PT_FILL) {
|
||||
pasteRoi->right = CONVERT_TO_ODD(output->width - ODD_NUM_1);
|
||||
pasteRoi->down = CONVERT_TO_ODD(output->height - ODD_NUM_1);
|
||||
return;
|
||||
}
|
||||
|
||||
bool widthRatioLarger = true;
|
||||
// The scaling ratio is based on the larger ratio to ensure the largest edge to fill the targe edge
|
||||
float resizeRatio = static_cast<float>(input->width) / output->width;
|
||||
if (resizeRatio < (static_cast<float>(input->height) / output->height)) {
|
||||
resizeRatio = static_cast<float>(input->height) / output->height;
|
||||
widthRatioLarger = false;
|
||||
}
|
||||
|
||||
// Left and up is 0 when the roi paste on the upper left corner
|
||||
if (processType == VPC_PT_PADDING) {
|
||||
pasteRoi->right = (input->width / resizeRatio) - ODD_NUM_1;
|
||||
pasteRoi->down = (input->height / resizeRatio) - ODD_NUM_1;
|
||||
pasteRoi->right = CONVERT_TO_ODD(pasteRoi->right);
|
||||
pasteRoi->down = CONVERT_TO_ODD(pasteRoi->down);
|
||||
return;
|
||||
}
|
||||
|
||||
const int halfValue = 2;
|
||||
// Left and up is 0 when the roi paste on the middler location
|
||||
if (widthRatioLarger) {
|
||||
pasteRoi->left = 0;
|
||||
pasteRoi->right = output->width - ODD_NUM_1;
|
||||
pasteRoi->up = (output->height - (input->height / resizeRatio)) / halfValue;
|
||||
pasteRoi->down = output->height - pasteRoi->up - ODD_NUM_1;
|
||||
} else {
|
||||
pasteRoi->up = 0;
|
||||
pasteRoi->down = output->height - ODD_NUM_1;
|
||||
pasteRoi->left = (output->width - (input->width / resizeRatio)) / halfValue;
|
||||
pasteRoi->right = output->width - pasteRoi->left - ODD_NUM_1;
|
||||
}
|
||||
|
||||
// The left must be even and align to 16, up must be even, right and down must be odd which is required by acl
|
||||
pasteRoi->left = DVPP_ALIGN_UP(CONVERT_TO_EVEN(pasteRoi->left), VPC_WIDTH_ALIGN);
|
||||
pasteRoi->right = CONVERT_TO_ODD(pasteRoi->right);
|
||||
pasteRoi->up = CONVERT_TO_EVEN(pasteRoi->up);
|
||||
pasteRoi->down = CONVERT_TO_ODD(pasteRoi->down);
|
||||
return;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Resize the image specified by input and save the result to member variable resizedImage_
|
||||
* @param: input specifies the input image information
|
||||
* @param: output specifies the output image information
|
||||
* @param: withSynchronize specifies whether to execute synchronously
|
||||
* @param: processType specifies whether to perform proportional scaling, default is non-proportional resize
|
||||
* @return: OK if success, other values if failure
|
||||
* @attention: This function can be called only when the DvppCommon object is initialized with Init
|
||||
*/
|
||||
int DvppCommon::CombineResizeProcess(std::shared_ptr<DvppDataInfo> input, const DvppDataInfo &output,
|
||||
bool withSynchronize, VpcProcessType processType) {
|
||||
int ret = CheckResizeParams(*input, output);
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
// Get widthStride and heightStride for input and output image according to the format
|
||||
ret = GetVpcInputStrideSize(input->widthStride, input->heightStride, input->format,
|
||||
&(input->widthStride), &(input->heightStride));
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
|
||||
resizedImage_ = std::make_shared<DvppDataInfo>();
|
||||
resizedImage_->width = output.width;
|
||||
resizedImage_->height = output.height;
|
||||
resizedImage_->format = output.format;
|
||||
ret = GetVpcOutputStrideSize(output.width, output.height, output.format, &(resizedImage_->widthStride),
|
||||
&(resizedImage_->heightStride));
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
// Get output buffer size for resize output
|
||||
ret = GetVpcDataSize(output.width, output.height, output.format, &(resizedImage_->dataSize));
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
// Malloc buffer for output of resize module
|
||||
// Need to pay attention to release of the buffer
|
||||
ret = acldvppMalloc(reinterpret_cast<void **>(&(resizedImage_->data)), resizedImage_->dataSize);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to malloc " << resizedImage_->dataSize << " bytes on dvpp for resize" << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
aclrtMemset(resizedImage_->data, resizedImage_->dataSize, YUV_GREYER_VALUE, resizedImage_->dataSize);
|
||||
resizedImage_->frameId = input->frameId;
|
||||
ret = VpcResize(input, resizedImage_, withSynchronize, processType);
|
||||
if (ret != OK) {
|
||||
// Release the output buffer when resize failed, otherwise release it after use
|
||||
RELEASE_DVPP_DATA(resizedImage_->data);
|
||||
}
|
||||
return ret;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Set the description of the output image and decode
|
||||
* @param: input specifies the input image information
|
||||
* @param: output specifies the output image information
|
||||
* @param: withSynchronize specifies whether to execute synchronously
|
||||
* @return: OK if success, other values if failure
|
||||
* @attention: This function can be called only when the DvppCommon object is initialized with Init
|
||||
*/
|
||||
int DvppCommon::JpegDecode(std::shared_ptr<DvppDataInfo> input,
|
||||
std::shared_ptr<DvppDataInfo> output,
|
||||
bool withSynchronize) {
|
||||
acldvppPicDesc *outputDesc = acldvppCreatePicDesc();
|
||||
decodeOutputDesc_.reset(outputDesc, g_picDescDeleter);
|
||||
|
||||
int ret = SetDvppPicDescData(output, decodeOutputDesc_);
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = acldvppJpegDecodeAsync(dvppChannelDesc_, input->data, input->dataSize, decodeOutputDesc_.get(), dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to decode jpeg, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
if (withSynchronize) {
|
||||
ret = aclrtSynchronizeStream(dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to synchronize stream, ret = " << ret << "." << std::endl;
|
||||
return DECODE_FAIL;
|
||||
}
|
||||
}
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get the aligned width and height of the image after decoding
|
||||
* @param: width specifies the width before alignment
|
||||
* @param: height specifies the height before alignment
|
||||
* @param: widthStride is used to save the width after alignment
|
||||
* @param: heightStride is used to save the height after alignment
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
void DvppCommon::GetJpegDecodeStrideSize(uint32_t width, uint32_t height,
|
||||
uint32_t *widthStride, uint32_t *heightStride) {
|
||||
*widthStride = DVPP_ALIGN_UP(width, JPEGD_STRIDE_WIDTH);
|
||||
*heightStride = DVPP_ALIGN_UP(height, JPEGD_STRIDE_HEIGHT);
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get picture width and height and number of channels from image data
|
||||
* @param: data specifies the memory to store the image data
|
||||
* @param: dataSize specifies the size of the image data
|
||||
* @param: width is used to save the image width
|
||||
* @param: height is used to save the image height
|
||||
* @param: components is used to save the number of channels
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::GetJpegImageInfo(const void *data, uint32_t dataSize, uint32_t *width, uint32_t *height,
|
||||
int32_t *components) {
|
||||
uint32_t widthTmp;
|
||||
uint32_t heightTmp;
|
||||
int32_t componentsTmp;
|
||||
int ret = acldvppJpegGetImageInfo(data, dataSize, &widthTmp, &heightTmp, &componentsTmp);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to get image info of jpeg, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
if (widthTmp > MAX_JPEGD_WIDTH || widthTmp < MIN_JPEGD_WIDTH) {
|
||||
std::cout << "Input width is invalid, not in [" << MIN_JPEGD_WIDTH << ", "
|
||||
<< MAX_JPEGD_WIDTH << "]." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
if (heightTmp > MAX_JPEGD_HEIGHT || heightTmp < MIN_JPEGD_HEIGHT) {
|
||||
std::cout << "Input height is invalid, not in [" << MIN_JPEGD_HEIGHT << ", "
|
||||
<< MAX_JPEGD_HEIGHT << "]." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
*width = widthTmp;
|
||||
*height = heightTmp;
|
||||
*components = componentsTmp;
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Get the size of the buffer for storing decoded images based on the image data, size, and format
|
||||
* @param: data specifies the memory to store the image data
|
||||
* @param: dataSize specifies the size of the image data
|
||||
* @param: format specifies the image format
|
||||
* @param: decSize is used to store the result size
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::GetJpegDecodeDataSize(const void *data, uint32_t dataSize, acldvppPixelFormat format,
|
||||
uint32_t *decSize) {
|
||||
uint32_t outputSize;
|
||||
int ret = acldvppJpegPredictDecSize(data, dataSize, format, &outputSize);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to predict decode size of jpeg image, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
*decSize = outputSize;
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Decode the image specified by imageInfo and save the result to member variable decodedImage_
|
||||
* @param: imageInfo specifies image information
|
||||
* @param: format specifies the image format
|
||||
* @param: withSynchronize specifies whether to execute synchronously
|
||||
* @return: OK if success, other values if failure
|
||||
* @attention: This function can be called only when the DvppCommon object is initialized with Init
|
||||
*/
|
||||
int DvppCommon::CombineJpegdProcess(const RawData& imageInfo, acldvppPixelFormat format, bool withSynchronize) {
|
||||
int32_t components;
|
||||
inputImage_ = std::make_shared<DvppDataInfo>();
|
||||
inputImage_->format = format;
|
||||
int ret = GetJpegImageInfo(imageInfo.data.get(), imageInfo.lenOfByte, &(inputImage_->width), &(inputImage_->height),
|
||||
&components);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to get input image info, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
// Get the buffer size of decode output according to the input data and output format
|
||||
uint32_t outBuffSize;
|
||||
ret = GetJpegDecodeDataSize(imageInfo.data.get(), imageInfo.lenOfByte, format, &outBuffSize);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to get size of decode output buffer, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
// In TransferImageH2D function, device buffer will be allocated to store the input image
|
||||
// Need to pay attention to release of the buffer
|
||||
ret = TransferImageH2D(imageInfo, inputImage_);
|
||||
if (ret != OK) {
|
||||
return ret;
|
||||
}
|
||||
|
||||
decodedImage_ = std::make_shared<DvppDataInfo>();
|
||||
decodedImage_->format = format;
|
||||
decodedImage_->width = inputImage_->width;
|
||||
decodedImage_->height = inputImage_->height;
|
||||
GetJpegDecodeStrideSize(inputImage_->width, inputImage_->height, &(decodedImage_->widthStride),
|
||||
&(decodedImage_->heightStride));
|
||||
decodedImage_->dataSize = outBuffSize;
|
||||
// Need to pay attention to release of the buffer
|
||||
ret = acldvppMalloc(reinterpret_cast<void **>(&decodedImage_->data), decodedImage_->dataSize);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to malloc memory on dvpp, ret = " << ret << "." << std::endl;
|
||||
RELEASE_DVPP_DATA(inputImage_->data);
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = JpegDecode(inputImage_, decodedImage_, withSynchronize);
|
||||
if (ret != OK) {
|
||||
RELEASE_DVPP_DATA(inputImage_->data);
|
||||
inputImage_->data = nullptr;
|
||||
RELEASE_DVPP_DATA(decodedImage_->data);
|
||||
decodedImage_->data = nullptr;
|
||||
return ret;
|
||||
}
|
||||
|
||||
return OK;
|
||||
}
|
||||
|
||||
/*
|
||||
* @description: Transfer data from host to device
|
||||
* @param: imageInfo specifies the image data on the host
|
||||
* @param: jpegInput is used to save the buffer and its size which is allocate on the device
|
||||
* @return: OK if success, other values if failure
|
||||
*/
|
||||
int DvppCommon::TransferImageH2D(const RawData& imageInfo, const std::shared_ptr<DvppDataInfo>& jpegInput) {
|
||||
if (imageInfo.lenOfByte == 0) {
|
||||
std::cout << "The input buffer size on host should not be empty." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
|
||||
uint8_t* inDevBuff = nullptr;
|
||||
int ret = acldvppMalloc(reinterpret_cast<void **>(&inDevBuff), imageInfo.lenOfByte);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to malloc " << imageInfo.lenOfByte << " bytes on dvpp, ret = " << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
// Copy the image data from host to device
|
||||
ret = aclrtMemcpyAsync(inDevBuff, imageInfo.lenOfByte, imageInfo.data.get(), imageInfo.lenOfByte,
|
||||
ACL_MEMCPY_HOST_TO_DEVICE, dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to copy " << imageInfo.lenOfByte << " bytes from host to device" << std::endl;
|
||||
RELEASE_DVPP_DATA(inDevBuff);
|
||||
return ret;
|
||||
}
|
||||
// Attention: We must call the aclrtSynchronizeStream to ensure the task of memory replication has been completed
|
||||
// after calling aclrtMemcpyAsync
|
||||
ret = aclrtSynchronizeStream(dvppStream_);
|
||||
if (ret != OK) {
|
||||
std::cout << "Failed to synchronize stream, ret = " << ret << "." << std::endl;
|
||||
RELEASE_DVPP_DATA(inDevBuff);
|
||||
return ret;
|
||||
}
|
||||
jpegInput->data = inDevBuff;
|
||||
jpegInput->dataSize = imageInfo.lenOfByte;
|
||||
return OK;
|
||||
}
|
||||
|
||||
std::shared_ptr<DvppDataInfo> DvppCommon::GetInputImage() {
|
||||
return inputImage_;
|
||||
}
|
||||
|
||||
std::shared_ptr<DvppDataInfo> DvppCommon::GetDecodedImage() {
|
||||
return decodedImage_;
|
||||
}
|
||||
|
||||
std::shared_ptr<DvppDataInfo> DvppCommon::GetResizedImage() {
|
||||
return resizedImage_;
|
||||
}
|
||||
|
||||
DvppCommon::~DvppCommon() {}
|
|
@ -1,226 +0,0 @@
|
|||
/*
|
||||
* Copyright(C) 2020. Huawei Technologies Co.,Ltd. All rights reserved.
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include <sys/time.h>
|
||||
#include <fstream>
|
||||
#include "../inc/ModelProcess.h"
|
||||
|
||||
ModelProcess::ModelProcess(const int deviceId) {
|
||||
deviceId_ = deviceId;
|
||||
}
|
||||
|
||||
ModelProcess::ModelProcess() {}
|
||||
|
||||
ModelProcess::~ModelProcess() {
|
||||
if (!isDeInit_) {
|
||||
DeInit();
|
||||
}
|
||||
}
|
||||
|
||||
void ModelProcess::DestroyDataset(aclmdlDataset *dataset) {
|
||||
// Just release the DataBuffer object and DataSet object, remain the buffer, because it is managerd by user
|
||||
if (dataset != nullptr) {
|
||||
for (size_t i = 0; i < aclmdlGetDatasetNumBuffers(dataset); i++) {
|
||||
aclDataBuffer* dataBuffer = aclmdlGetDatasetBuffer(dataset, i);
|
||||
if (dataBuffer != nullptr) {
|
||||
aclDestroyDataBuffer(dataBuffer);
|
||||
dataBuffer = nullptr;
|
||||
}
|
||||
}
|
||||
aclmdlDestroyDataset(dataset);
|
||||
}
|
||||
}
|
||||
|
||||
aclmdlDesc *ModelProcess::GetModelDesc() {
|
||||
return modelDesc_.get();
|
||||
}
|
||||
|
||||
int ModelProcess::ModelInference(const std::vector<void *> &inputBufs,
|
||||
const std::vector<size_t> &inputSizes,
|
||||
const std::vector<void *> &ouputBufs,
|
||||
const std::vector<size_t> &outputSizes,
|
||||
std::map<double, double> *costTime_map) {
|
||||
std::cout << "ModelProcess:Begin to inference." << std::endl;
|
||||
aclmdlDataset *input = nullptr;
|
||||
input = CreateAndFillDataset(inputBufs, inputSizes);
|
||||
if (input == nullptr) {
|
||||
return INVALID_POINTER;
|
||||
}
|
||||
int ret;
|
||||
|
||||
aclmdlDataset *output = nullptr;
|
||||
output = CreateAndFillDataset(ouputBufs, outputSizes);
|
||||
if (output == nullptr) {
|
||||
DestroyDataset(input);
|
||||
input = nullptr;
|
||||
return INVALID_POINTER;
|
||||
}
|
||||
struct timeval start;
|
||||
struct timeval end;
|
||||
double startTime_ms;
|
||||
double endTime_ms;
|
||||
mtx_.lock();
|
||||
gettimeofday(&start, NULL);
|
||||
ret = aclmdlExecute(modelId_, input, output);
|
||||
gettimeofday(&end, NULL);
|
||||
startTime_ms = (1.0 * start.tv_sec * 1000000 + start.tv_usec) / 1000;
|
||||
endTime_ms = (1.0 * end.tv_sec * 1000000 + end.tv_usec) / 1000;
|
||||
costTime_map->insert(std::pair<double, double>(startTime_ms, endTime_ms));
|
||||
mtx_.unlock();
|
||||
if (ret != OK) {
|
||||
std::cout << "aclmdlExecute failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
DestroyDataset(input);
|
||||
DestroyDataset(output);
|
||||
return OK;
|
||||
}
|
||||
|
||||
int ModelProcess::DeInit() {
|
||||
isDeInit_ = true;
|
||||
int ret = aclmdlUnload(modelId_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclmdlUnload failed, ret["<< ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
if (modelDevPtr_ != nullptr) {
|
||||
ret = aclrtFree(modelDevPtr_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtFree failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
modelDevPtr_ = nullptr;
|
||||
}
|
||||
if (weightDevPtr_ != nullptr) {
|
||||
ret = aclrtFree(weightDevPtr_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtFree failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
weightDevPtr_ = nullptr;
|
||||
}
|
||||
|
||||
return OK;
|
||||
}
|
||||
/**
|
||||
* Read a binary file, store the data into a uint8_t array
|
||||
*
|
||||
* @param fileName the file for reading
|
||||
* @param buffShared a shared pointer to a uint8_t array for storing file
|
||||
* @param buffLength the length of the array
|
||||
* @return OK if create success, error code otherwise
|
||||
*/
|
||||
int ModelProcess::ReadBinaryFile(const std::string &fileName, uint8_t **buffShared, int *buffLength) {
|
||||
std::ifstream inFile(fileName, std::ios::in | std::ios::binary);
|
||||
if (!inFile) {
|
||||
std::cout << "FaceFeatureLib: read file " << fileName << " fail." <<std::endl;
|
||||
return READ_FILE_FAIL;
|
||||
}
|
||||
|
||||
inFile.seekg(0, inFile.end);
|
||||
*buffLength = inFile.tellg();
|
||||
inFile.seekg(0, inFile.beg);
|
||||
|
||||
uint8_t *tempShared = reinterpret_cast<uint8_t *>(malloc(*buffLength));
|
||||
inFile.read(reinterpret_cast<char *>(tempShared), *buffLength);
|
||||
inFile.close();
|
||||
*buffShared = tempShared;
|
||||
|
||||
std::cout << "read file: fileName=" << fileName << ", size=" << *buffLength << "." << std::endl;
|
||||
|
||||
return OK;
|
||||
}
|
||||
|
||||
int ModelProcess::Init(const std::string &modelPath) {
|
||||
std::cout << "ModelProcess:Begin to init instance." << std::endl;
|
||||
int modelSize = 0;
|
||||
uint8_t *modelData = nullptr;
|
||||
int ret = ReadBinaryFile(modelPath, &modelData, &modelSize);
|
||||
if (ret != OK) {
|
||||
std::cout << "read model file failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = aclmdlQuerySizeFromMem(modelData, modelSize, &modelDevPtrSize_, &weightDevPtrSize_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclmdlQuerySizeFromMem failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
std::cout << "modelDevPtrSize_[" << modelDevPtrSize_ << "]" << std::endl;
|
||||
std::cout << " weightDevPtrSize_[" << weightDevPtrSize_ << "]." << std::endl;
|
||||
|
||||
ret = aclrtMalloc(&modelDevPtr_, modelDevPtrSize_, ACL_MEM_MALLOC_HUGE_FIRST);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtMalloc dev_ptr failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = aclrtMalloc(&weightDevPtr_, weightDevPtrSize_, ACL_MEM_MALLOC_HUGE_FIRST);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtMalloc weight_ptr failed, ret[" << ret << "] " << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = aclmdlLoadFromMemWithMem(modelData, modelSize, &modelId_, modelDevPtr_, modelDevPtrSize_,
|
||||
weightDevPtr_, weightDevPtrSize_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclmdlLoadFromMemWithMem failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = aclrtGetCurrentContext(&contextModel_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclrtMalloc weight_ptr failed, ret[" << ret << "]." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
|
||||
aclmdlDesc *modelDesc = aclmdlCreateDesc();
|
||||
if (modelDesc == nullptr) {
|
||||
std::cout << "aclmdlCreateDesc failed." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
ret = aclmdlGetDesc(modelDesc, modelId_);
|
||||
if (ret != OK) {
|
||||
std::cout << "aclmdlGetDesc ret fail, ret:" << ret << "." << std::endl;
|
||||
return ret;
|
||||
}
|
||||
modelDesc_.reset(modelDesc, aclmdlDestroyDesc);
|
||||
free(modelData);
|
||||
return OK;
|
||||
}
|
||||
|
||||
aclmdlDataset *ModelProcess::CreateAndFillDataset(const std::vector<void *> &bufs, const std::vector<size_t> &sizes) {
|
||||
aclmdlDataset *dataset = aclmdlCreateDataset();
|
||||
if (dataset == nullptr) {
|
||||
std::cout << "ACL_ModelInputCreate failed." << std::endl;
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
for (size_t i = 0; i < bufs.size(); ++i) {
|
||||
aclDataBuffer *data = aclCreateDataBuffer(bufs[i], sizes[i]);
|
||||
if (data == nullptr) {
|
||||
DestroyDataset(dataset);
|
||||
std::cout << "aclCreateDataBuffer failed." << std::endl;
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
int ret = aclmdlAddDatasetBuffer(dataset, data);
|
||||
if (ret != OK) {
|
||||
DestroyDataset(dataset);
|
||||
std::cout << "ACL_ModelInputDataAdd failed, ret[" << ret << "]." << std::endl;
|
||||
return nullptr;
|
||||
}
|
||||
}
|
||||
return dataset;
|
||||
}
|
|
@ -1,56 +0,0 @@
|
|||
#!/bin/bash
|
||||
# Copyright 2020 Huawei Technologies Co., Ltd
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
# ============================================================================
|
||||
path_cur=$(cd "`dirname $0`" || exit; pwd)
|
||||
build_type="Release"
|
||||
|
||||
function preparePath() {
|
||||
rm -rf $1
|
||||
mkdir -p $1
|
||||
cd $1 || exit
|
||||
}
|
||||
|
||||
function buildA300() {
|
||||
if [ ! "${ARCH_PATTERN}" ]; then
|
||||
# set ARCH_PATTERN to acllib when it was not specified by user
|
||||
export ARCH_PATTERN=acllib
|
||||
echo "ARCH_PATTERN is set to the default value: ${ARCH_PATTERN}"
|
||||
else
|
||||
echo "ARCH_PATTERN is set to ${ARCH_PATTERN} by user, reset it to ${ARCH_PATTERN}/acllib"
|
||||
export ARCH_PATTERN=${ARCH_PATTERN}/acllib
|
||||
fi
|
||||
|
||||
path_build=$path_cur/build
|
||||
preparePath $path_build
|
||||
cmake -DCMAKE_BUILD_TYPE=$build_type ..
|
||||
make -j
|
||||
ret=$?
|
||||
cd ..
|
||||
return ${ret}
|
||||
}
|
||||
|
||||
# set ASCEND_VERSION to ascend-toolkit/latest when it was not specified by user
|
||||
if [ ! "${ASCEND_VERSION}" ]; then
|
||||
export ASCEND_VERSION=ascend-toolkit/latest
|
||||
echo "Set ASCEND_VERSION to the default value: ${ASCEND_VERSION}"
|
||||
else
|
||||
echo "ASCEND_VERSION is set to ${ASCEND_VERSION} by user"
|
||||
fi
|
||||
|
||||
buildA300
|
||||
|
||||
if [ $? -ne 0 ]; then
|
||||
exit 1
|
||||
fi
|
|
@ -0,0 +1,235 @@
|
|||
/**
|
||||
* Copyright 2021 Huawei Technologies Co., Ltd
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
#include <sys/time.h>
|
||||
#include <gflags/gflags.h>
|
||||
#include <dirent.h>
|
||||
#include <iostream>
|
||||
#include <string>
|
||||
#include <algorithm>
|
||||
#include <iosfwd>
|
||||
#include <vector>
|
||||
#include <fstream>
|
||||
#include <sstream>
|
||||
|
||||
#include "include/api/context.h"
|
||||
#include "include/api/model.h"
|
||||
#include "include/api/types.h"
|
||||
#include "include/api/serialization.h"
|
||||
#include "include/minddata/dataset/include/vision.h"
|
||||
#include "include/minddata/dataset/include/transforms.h"
|
||||
#include "include/minddata/dataset/include/execute.h"
|
||||
#include "../inc/utils.h"
|
||||
|
||||
using mindspore::Context;
|
||||
using mindspore::Serialization;
|
||||
using mindspore::Model;
|
||||
using mindspore::Status;
|
||||
using mindspore::ModelType;
|
||||
using mindspore::GraphCell;
|
||||
using mindspore::kSuccess;
|
||||
using mindspore::MSTensor;
|
||||
using mindspore::DataType;
|
||||
using mindspore::dataset::Execute;
|
||||
using mindspore::dataset::TensorTransform;
|
||||
using mindspore::dataset::vision::Resize;
|
||||
using mindspore::dataset::vision::Pad;
|
||||
using mindspore::dataset::vision::HWC2CHW;
|
||||
using mindspore::dataset::vision::Normalize;
|
||||
using mindspore::dataset::vision::SwapRedBlue;
|
||||
using mindspore::dataset::vision::Decode;
|
||||
using mindspore::dataset::transforms::TypeCast;
|
||||
|
||||
|
||||
DEFINE_string(mindir_path, "", "mindir path");
|
||||
DEFINE_string(dataset_path, ".", "dataset path");
|
||||
DEFINE_int32(device_id, 0, "device id");
|
||||
|
||||
const int IMAGEWIDTH = 1280;
|
||||
const int IMAGEHEIGHT = 768;
|
||||
|
||||
int PadImage(const MSTensor &input, MSTensor *output) {
|
||||
std::shared_ptr<TensorTransform> normalize(new Normalize({103.53, 116.28, 123.675},
|
||||
{57.375, 57.120, 58.395}));
|
||||
Execute composeNormalize({normalize});
|
||||
std::vector<int64_t> shape = input.Shape();
|
||||
auto imgResize = MSTensor();
|
||||
auto imgPad = MSTensor();
|
||||
|
||||
float widthScale, heightScale;
|
||||
widthScale = static_cast<float>(IMAGEWIDTH) / shape[1];
|
||||
heightScale = static_cast<float>(IMAGEHEIGHT) / shape[0];
|
||||
Status ret;
|
||||
if (widthScale < heightScale) {
|
||||
int heightSize = shape[0]*widthScale;
|
||||
std::shared_ptr<TensorTransform> resize(new Resize({heightSize, IMAGEWIDTH}));
|
||||
Execute composeResizeWidth({resize});
|
||||
ret = composeResizeWidth(input, &imgResize);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Resize Width failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
int paddingSize = IMAGEHEIGHT - heightSize;
|
||||
std::shared_ptr<TensorTransform> pad(new Pad({0, 0, 0, paddingSize}));
|
||||
Execute composePad({pad});
|
||||
ret = composePad(imgResize, &imgPad);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Height Pad failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
ret = composeNormalize(imgPad, output);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Normalize failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
} else {
|
||||
int widthSize = shape[1]*heightScale;
|
||||
std::shared_ptr<TensorTransform> resize(new Resize({IMAGEHEIGHT, widthSize}));
|
||||
Execute composeResizeHeight({resize});
|
||||
ret = composeResizeHeight(input, &imgResize);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Resize Height failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
int paddingSize = IMAGEWIDTH - widthSize;
|
||||
std::shared_ptr<TensorTransform> pad(new Pad({0, 0, paddingSize, 0}));
|
||||
Execute composePad({pad});
|
||||
ret = composePad(imgResize, &imgPad);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Width Pad failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
ret = composeNormalize(imgPad, output);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Normalize failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
}
|
||||
return 0;
|
||||
}
|
||||
|
||||
int main(int argc, char **argv) {
|
||||
gflags::ParseCommandLineFlags(&argc, &argv, true);
|
||||
if (RealPath(FLAGS_mindir_path).empty()) {
|
||||
std::cout << "Invalid mindir" << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
auto context = std::make_shared<Context>();
|
||||
auto ascend310 = std::make_shared<mindspore::Ascend310DeviceInfo>();
|
||||
ascend310->SetDeviceID(FLAGS_device_id);
|
||||
ascend310->SetPrecisionMode("allow_fp32_to_fp16");
|
||||
context->MutableDeviceInfo().push_back(ascend310);
|
||||
mindspore::Graph graph;
|
||||
Serialization::Load(FLAGS_mindir_path, ModelType::kMindIR, &graph);
|
||||
|
||||
Model model;
|
||||
Status ret = model.Build(GraphCell(graph), context);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "ERROR: Build failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
std::vector<MSTensor> model_inputs = model.GetInputs();
|
||||
|
||||
auto all_files = GetAllFiles(FLAGS_dataset_path);
|
||||
if (all_files.empty()) {
|
||||
std::cout << "ERROR: no input data." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
|
||||
std::map<double, double> costTime_map;
|
||||
size_t size = all_files.size();
|
||||
std::shared_ptr<TensorTransform> decode(new Decode());
|
||||
Execute composeDecode({decode});
|
||||
std::shared_ptr<TensorTransform> hwc2chw(new HWC2CHW());
|
||||
Execute composeTranspose({hwc2chw});
|
||||
std::shared_ptr<TensorTransform> typeCast(new TypeCast(DataType::kNumberTypeFloat16));
|
||||
Execute transformCast(typeCast);
|
||||
|
||||
for (size_t i = 0; i < size; ++i) {
|
||||
struct timeval start = {0};
|
||||
struct timeval end = {0};
|
||||
double startTimeMs;
|
||||
double endTimeMs;
|
||||
std::vector<MSTensor> inputs;
|
||||
std::vector<MSTensor> outputs;
|
||||
std::cout << "Start predict input files:" << all_files[i] << std::endl;
|
||||
auto imgDecode = MSTensor();
|
||||
auto image = ReadFileToTensor(all_files[i]);
|
||||
composeDecode(image, &imgDecode);
|
||||
|
||||
auto imgPad = MSTensor();
|
||||
PadImage(imgDecode, &imgPad);
|
||||
auto img = MSTensor();
|
||||
composeTranspose(imgPad, &img);
|
||||
transformCast(img, &img);
|
||||
|
||||
std::vector<int64_t> shape = imgDecode.Shape();
|
||||
|
||||
float widthScale = static_cast<float>(IMAGEWIDTH) / shape[1];
|
||||
float heightScale = static_cast<float>(IMAGEHEIGHT) / shape[0];
|
||||
float resizeScale = widthScale < heightScale ? widthScale : heightScale;
|
||||
|
||||
float imgInfo[4];
|
||||
imgInfo[0] = shape[0];
|
||||
imgInfo[1] = shape[1];
|
||||
imgInfo[2] = resizeScale;
|
||||
imgInfo[3] = resizeScale;
|
||||
|
||||
MSTensor imgMeta("imgMeta", DataType::kNumberTypeFloat32, {static_cast<int64_t>(4)}, imgInfo, 16);
|
||||
transformCast(imgMeta, &imgMeta);
|
||||
|
||||
inputs.emplace_back(model_inputs[0].Name(), model_inputs[0].DataType(), model_inputs[0].Shape(),
|
||||
img.Data().get(), img.DataSize());
|
||||
inputs.emplace_back(model_inputs[1].Name(), model_inputs[1].DataType(), model_inputs[1].Shape(),
|
||||
imgMeta.Data().get(), imgMeta.DataSize());
|
||||
|
||||
gettimeofday(&start, nullptr);
|
||||
ret = model.Predict(inputs, &outputs);
|
||||
gettimeofday(&end, nullptr);
|
||||
if (ret != kSuccess) {
|
||||
std::cout << "Predict " << all_files[i] << " failed." << std::endl;
|
||||
return 1;
|
||||
}
|
||||
startTimeMs = (1.0 * start.tv_sec * 1000000 + start.tv_usec) / 1000;
|
||||
endTimeMs = (1.0 * end.tv_sec * 1000000 + end.tv_usec) / 1000;
|
||||
costTime_map.insert(std::pair<double, double>(startTimeMs, endTimeMs));
|
||||
WriteResult(all_files[i], outputs);
|
||||
}
|
||||
double average = 0.0;
|
||||
int inferCount = 0;
|
||||
|
||||
for (auto iter = costTime_map.begin(); iter != costTime_map.end(); iter++) {
|
||||
double diff = 0.0;
|
||||
diff = iter->second - iter->first;
|
||||
average += diff;
|
||||
inferCount++;
|
||||
}
|
||||
average = average / inferCount;
|
||||
std::stringstream timeCost;
|
||||
timeCost << "NN inference cost average time: "<< average << " ms of infer_count " << inferCount << std::endl;
|
||||
std::cout << "NN inference cost average time: "<< average << "ms of infer_count " << inferCount << std::endl;
|
||||
|
||||
std::string fileName = "./time_Result" + std::string("/test_perform_static.txt");
|
||||
std::ofstream fileStream(fileName.c_str(), std::ios::trunc);
|
||||
fileStream << timeCost.str();
|
||||
fileStream.close();
|
||||
costTime_map.clear();
|
||||
return 0;
|
||||
}
|
|
@ -1,132 +0,0 @@
|
|||
/*
|
||||
* Copyright (c) 2020.Huawei Technologies Co., Ltd. All rights reserved.
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
#include <dirent.h>
|
||||
#include <sys/stat.h>
|
||||
#include <gflags/gflags.h>
|
||||
#include <unistd.h>
|
||||
#include <cstring>
|
||||
#include <fstream>
|
||||
#include <sstream>
|
||||
#include "../inc/AclProcess.h"
|
||||
#include "../inc/CommonDataType.h"
|
||||
|
||||
DEFINE_string(om_path, "./maskrcnn.om", "om model path.");
|
||||
DEFINE_string(data_path, "./test.jpg", "om model path.");
|
||||
DEFINE_int32(width, 1280, "width");
|
||||
DEFINE_int32(height, 768, "height");
|
||||
DEFINE_int32(device_id, 0, "height");
|
||||
|
||||
static bool is_file(const std::string &filename) {
|
||||
struct stat buffer;
|
||||
return (stat(filename.c_str(), &buffer) == 0 && S_ISREG(buffer.st_mode));
|
||||
}
|
||||
|
||||
static bool is_dir(const std::string &filefodler) {
|
||||
struct stat buffer;
|
||||
return (stat(filefodler.c_str(), &buffer) == 0 && S_ISDIR(buffer.st_mode));
|
||||
}
|
||||
/*
|
||||
* @description Initialize and run AclProcess module
|
||||
* @param resourceInfo resource info of deviceIds, model info, single Operator Path, etc
|
||||
* @param file the absolute path of input file
|
||||
* @return int int code
|
||||
*/
|
||||
int main(int argc, char* argv[]) {
|
||||
gflags::ParseCommandLineFlags(&argc, &argv, true);
|
||||
std::cout << "OM File Path :" << FLAGS_om_path << std::endl;
|
||||
std::cout << "data Path :" << FLAGS_data_path << std::endl;
|
||||
std::cout << "width :" << FLAGS_width << std::endl;
|
||||
std::cout << "height :" << FLAGS_height << std::endl;
|
||||
std::cout << "deviceId :" << FLAGS_device_id << std::endl;
|
||||
|
||||
char omAbsPath[PATH_MAX];
|
||||
if (realpath(FLAGS_om_path.c_str(), omAbsPath) == nullptr) {
|
||||
std::cout << "Failed to get the om real path." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
|
||||
if (access(omAbsPath, R_OK) == -1) {
|
||||
std::cout << "ModelPath " << omAbsPath << " doesn't exist or read failed." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
|
||||
char dataAbsPath[PATH_MAX];
|
||||
if (realpath(FLAGS_data_path.c_str(), dataAbsPath) == nullptr) {
|
||||
std::cout << "Failed to get the data real path." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
if (access(dataAbsPath, R_OK) == -1) {
|
||||
std::cout << "data paeh " << dataAbsPath << " doesn't exist or read failed." << std::endl;
|
||||
return INVALID_PARAM;
|
||||
}
|
||||
|
||||
std::map<double, double> costTime_map;
|
||||
AclProcess aclProcess(FLAGS_device_id, FLAGS_om_path, FLAGS_width, FLAGS_height);
|
||||
int ret = aclProcess.InitResource();
|
||||
if (ret != OK) {
|
||||
aclProcess.Release();
|
||||
return ret;
|
||||
}
|
||||
if (is_file(FLAGS_data_path)) {
|
||||
ret = aclProcess.Process(FLAGS_data_path, &costTime_map);
|
||||
if (ret != OK) {
|
||||
std::cout << "model process failed, errno = " << ret << std::endl;
|
||||
return ret;
|
||||
}
|
||||
} else if (is_dir(FLAGS_data_path)) {
|
||||
struct dirent *filename;
|
||||
DIR *dir;
|
||||
dir = opendir(FLAGS_data_path.c_str());
|
||||
if (dir == nullptr) {
|
||||
return ERROR;
|
||||
}
|
||||
|
||||
while ((filename = readdir(dir)) != nullptr) {
|
||||
if (strcmp(filename->d_name, ".") == 0 || strcmp(filename->d_name, "..") == 0) {
|
||||
continue;
|
||||
}
|
||||
std::string wholePath = FLAGS_data_path + "/" + filename->d_name;
|
||||
ret = aclProcess.Process(wholePath, &costTime_map);
|
||||
if (ret != OK) {
|
||||
std::cout << "model process failed, errno = " << ret << std::endl;
|
||||
return ret;
|
||||
}
|
||||
}
|
||||
} else {
|
||||
std::cout << " input image path error" << std::endl;
|
||||
}
|
||||
|
||||
double average = 0.0;
|
||||
int infer_cnt = 0;
|
||||
|
||||
for (auto iter = costTime_map.begin(); iter != costTime_map.end(); iter++) {
|
||||
double diff = 0.0;
|
||||
diff = iter->second - iter->first;
|
||||
average += diff;
|
||||
infer_cnt++;
|
||||
}
|
||||
average = average / infer_cnt;
|
||||
std::stringstream timeCost;
|
||||
timeCost << "NN inference cost average time: "<< average << " ms of infer_count " << infer_cnt << std::endl;
|
||||
std::cout << "NN inference cost average time: "<< average << "ms of infer_count " << infer_cnt << std::endl;
|
||||
std::string file_name = "./time_Result" + std::string("/test_perform_static.txt");
|
||||
std::ofstream file_stream(file_name.c_str(), std::ios::trunc);
|
||||
file_stream << timeCost.str();
|
||||
file_stream.close();
|
||||
costTime_map.clear();
|
||||
|
||||
aclProcess.Release();
|
||||
return OK;
|
||||
}
|
|
@ -0,0 +1,129 @@
|
|||
/**
|
||||
* Copyright 2021 Huawei Technologies Co., Ltd
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include <fstream>
|
||||
#include <algorithm>
|
||||
#include <iostream>
|
||||
#include "../inc/utils.h"
|
||||
|
||||
using mindspore::MSTensor;
|
||||
using mindspore::DataType;
|
||||
|
||||
std::vector<std::string> GetAllFiles(std::string_view dirName) {
|
||||
struct dirent *filename;
|
||||
DIR *dir = OpenDir(dirName);
|
||||
if (dir == nullptr) {
|
||||
return {};
|
||||
}
|
||||
std::vector<std::string> res;
|
||||
while ((filename = readdir(dir)) != nullptr) {
|
||||
std::string dName = std::string(filename->d_name);
|
||||
if (dName == "." || dName == ".." || filename->d_type != DT_REG) {
|
||||
continue;
|
||||
}
|
||||
res.emplace_back(std::string(dirName) + "/" + filename->d_name);
|
||||
}
|
||||
std::sort(res.begin(), res.end());
|
||||
for (auto &f : res) {
|
||||
std::cout << "image file: " << f << std::endl;
|
||||
}
|
||||
return res;
|
||||
}
|
||||
|
||||
int WriteResult(const std::string& imageFile, const std::vector<MSTensor> &outputs) {
|
||||
std::string homePath = "./result_Files";
|
||||
for (size_t i = 0; i < outputs.size(); ++i) {
|
||||
size_t outputSize;
|
||||
std::shared_ptr<const void> netOutput;
|
||||
netOutput = outputs[i].Data();
|
||||
outputSize = outputs[i].DataSize();
|
||||
int pos = imageFile.rfind('/');
|
||||
std::string fileName(imageFile, pos + 1);
|
||||
fileName.replace(fileName.find('.'), fileName.size() - fileName.find('.'), '_' + std::to_string(i) + ".bin");
|
||||
std::string outFileName = homePath + "/" + fileName;
|
||||
FILE * outputFile = fopen(outFileName.c_str(), "wb");
|
||||
fwrite(netOutput.get(), outputSize, sizeof(char), outputFile);
|
||||
fclose(outputFile);
|
||||
outputFile = nullptr;
|
||||
}
|
||||
return 0;
|
||||
}
|
||||
|
||||
MSTensor ReadFileToTensor(const std::string &file) {
|
||||
if (file.empty()) {
|
||||
std::cout << "Pointer file is nullptr" << std::endl;
|
||||
return MSTensor();
|
||||
}
|
||||
|
||||
std::ifstream ifs(file);
|
||||
if (!ifs.good()) {
|
||||
std::cout << "File: " << file << " is not exist" << std::endl;
|
||||
return MSTensor();
|
||||
}
|
||||
|
||||
if (!ifs.is_open()) {
|
||||
std::cout << "File: " << file << "open failed" << std::endl;
|
||||
return MSTensor();
|
||||
}
|
||||
|
||||
ifs.seekg(0, std::ios::end);
|
||||
size_t size = ifs.tellg();
|
||||
MSTensor buffer(file, mindspore::DataType::kNumberTypeUInt8, {static_cast<int64_t>(size)}, nullptr, size);
|
||||
|
||||
ifs.seekg(0, std::ios::beg);
|
||||
ifs.read(reinterpret_cast<char *>(buffer.MutableData()), size);
|
||||
ifs.close();
|
||||
|
||||
return buffer;
|
||||
}
|
||||
|
||||
|
||||
DIR *OpenDir(std::string_view dirName) {
|
||||
if (dirName.empty()) {
|
||||
std::cout << " dirName is null ! " << std::endl;
|
||||
return nullptr;
|
||||
}
|
||||
std::string realPath = RealPath(dirName);
|
||||
struct stat s;
|
||||
lstat(realPath.c_str(), &s);
|
||||
if (!S_ISDIR(s.st_mode)) {
|
||||
std::cout << "dirName is not a valid directory !" << std::endl;
|
||||
return nullptr;
|
||||
}
|
||||
DIR *dir;
|
||||
dir = opendir(realPath.c_str());
|
||||
if (dir == nullptr) {
|
||||
std::cout << "Can not open dir " << dirName << std::endl;
|
||||
return nullptr;
|
||||
}
|
||||
std::cout << "Successfully opened the dir " << dirName << std::endl;
|
||||
return dir;
|
||||
}
|
||||
|
||||
std::string RealPath(std::string_view path) {
|
||||
char realPathMem[PATH_MAX] = {0};
|
||||
char *realPathRet = nullptr;
|
||||
realPathRet = realpath(path.data(), realPathMem);
|
||||
|
||||
if (realPathRet == nullptr) {
|
||||
std::cout << "File: " << path << " is not exist.";
|
||||
return "";
|
||||
}
|
||||
|
||||
std::string realPath(realPathMem);
|
||||
std::cout << path << " realpath is: " << realPath << std::endl;
|
||||
return realPath;
|
||||
}
|
|
@ -13,6 +13,7 @@
|
|||
# limitations under the License.
|
||||
# ============================================================================
|
||||
"""post process for 310 inference"""
|
||||
import os
|
||||
import argparse
|
||||
import numpy as np
|
||||
from PIL import Image
|
||||
|
@ -27,6 +28,7 @@ dst_height = 768
|
|||
parser = argparse.ArgumentParser(description="maskrcnn inference")
|
||||
parser.add_argument("--ann_file", type=str, required=True, help="ann file.")
|
||||
parser.add_argument("--img_path", type=str, required=True, help="image file path.")
|
||||
parser.add_argument("--result_path", type=str, required=True, help="result file path.")
|
||||
args = parser.parse_args()
|
||||
|
||||
def get_img_size(file_name):
|
||||
|
@ -41,10 +43,10 @@ def get_resize_ratio(img_size):
|
|||
|
||||
return resize_ratio
|
||||
|
||||
def get_eval_result(ann_file, img_path):
|
||||
def get_eval_result(ann_file, img_path, result_path):
|
||||
""" Get metrics result according to the annotation file and result file"""
|
||||
max_num = 128
|
||||
result_path = "./result_Files/"
|
||||
result_path = result_path
|
||||
outputs = []
|
||||
|
||||
dataset_coco = COCO(ann_file)
|
||||
|
@ -52,16 +54,16 @@ def get_eval_result(ann_file, img_path):
|
|||
|
||||
for img_id in img_ids:
|
||||
file_id = str(img_id).zfill(12)
|
||||
file = img_path + "/" + file_id + ".jpg"
|
||||
file = os.path.join(img_path, file_id + ".jpg")
|
||||
img_size = get_img_size(file)
|
||||
resize_ratio = get_resize_ratio(img_size)
|
||||
|
||||
img_metas = np.array([img_size[1], img_size[0]] + [resize_ratio, resize_ratio])
|
||||
|
||||
bbox_result_file = result_path + file_id + "_0.bin"
|
||||
label_result_file = result_path + file_id + "_1.bin"
|
||||
mask_result_file = result_path + file_id + "_2.bin"
|
||||
mask_fb_result_file = result_path + file_id + "_3.bin"
|
||||
bbox_result_file = os.path.join(result_path, file_id + "_0.bin")
|
||||
label_result_file = os.path.join(result_path, file_id + "_1.bin")
|
||||
mask_result_file = os.path.join(result_path, file_id + "_2.bin")
|
||||
mask_fb_result_file = os.path.join(result_path, file_id + "_3.bin")
|
||||
|
||||
all_bbox = np.fromfile(bbox_result_file, dtype=np.float16).reshape(80000, 5)
|
||||
all_label = np.fromfile(label_result_file, dtype=np.int32).reshape(80000, 1)
|
||||
|
@ -94,4 +96,4 @@ def get_eval_result(ann_file, img_path):
|
|||
coco_eval(result_files, eval_types, dataset_coco, single_result=False)
|
||||
|
||||
if __name__ == '__main__':
|
||||
get_eval_result(args.ann_file, args.img_path)
|
||||
get_eval_result(args.ann_file, args.img_path, args.result_path)
|
||||
|
|
|
@ -15,59 +15,50 @@
|
|||
# ============================================================================
|
||||
|
||||
if [[ $# -lt 3 || $# -gt 4 ]]; then
|
||||
echo "Usage: sh run_infer_310.sh [AIR_PATH] [DATA_PATH] [ANN_FILE_PATH] [DEVICE_ID]
|
||||
echo "Usage: bash run_infer_310.sh [MINDIR_PATH] [DATA_PATH] [ANN_FILE] [DEVICE_ID]
|
||||
DEVICE_ID is optional, it can be set by environment variable device_id, otherwise the value is zero"
|
||||
exit 1
|
||||
fi
|
||||
|
||||
get_real_path(){
|
||||
if [ "${1:0:1}" == "/" ]; then
|
||||
echo "$1"
|
||||
else
|
||||
echo "$(realpath -m $PWD/$1)"
|
||||
fi
|
||||
if [ "${1:0:1}" == "/" ]; then
|
||||
echo "$1"
|
||||
else
|
||||
echo "$(realpath -m $PWD/$1)"
|
||||
fi
|
||||
}
|
||||
model=$(get_real_path $1)
|
||||
data_path=$(get_real_path $2)
|
||||
ann_file=$(get_real_path $3)
|
||||
|
||||
device_id=0
|
||||
if [ $# == 4 ]; then
|
||||
device_id=$4
|
||||
elif [ $# == 3 ]; then
|
||||
if [ -z $device_id ]; then
|
||||
device_id=0
|
||||
else
|
||||
device_id=$device_id
|
||||
fi
|
||||
fi
|
||||
|
||||
echo $model
|
||||
echo $data_path
|
||||
echo $ann_file
|
||||
echo $device_id
|
||||
echo "mindir name: "$model
|
||||
echo "dataset path: "$data_path
|
||||
echo "ann file: "$ann_file
|
||||
echo "device id: "$device_id
|
||||
|
||||
export ASCEND_HOME=/usr/local/Ascend/
|
||||
if [ -d ${ASCEND_HOME}/ascend-toolkit ]; then
|
||||
export PATH=$ASCEND_HOME/ascend-toolkit/latest/fwkacllib/ccec_compiler/bin:$ASCEND_HOME/ascend-toolkit/latest/atc/bin:$PATH
|
||||
export LD_LIBRARY_PATH=/usr/local/lib:$ASCEND_HOME/ascend-toolkit/latest/atc/lib64:$ASCEND_HOME/ascend-toolkit/latest/acllib/lib64:$ASCEND_HOME/ascend-toolkit/latest/fwkacllib/lib64:$ASCEND_HOME/driver/lib64:$ASCEND_HOME/add-ones:$LD_LIBRARY_PATH
|
||||
export TBE_IMPL_PATH=${ASCEND_HOME}/ascend-toolkit/latest/opp/op_impl/built-in/ai_core/tbe
|
||||
export LD_LIBRARY_PATH=/usr/local/lib:$ASCEND_HOME/ascend-toolkit/latest/atc/lib64:$ASCEND_HOME/ascend-toolkit/latest/acllib/lib64:$ASCEND_HOME/ascend-toolkit/latest/fwkacllib/lib64:$ASCEND_HOME/driver/lib64:$ASCEND_HOME/add-ons:$LD_LIBRARY_PATH
|
||||
export TBE_IMPL_PATH=$ASCEND_HOME/ascend-toolkit/latest/opp/op_impl/built-in/ai_core/tbe
|
||||
export PYTHONPATH=${TBE_IMPL_PATH}:$ASCEND_HOME/ascend-toolkit/latest/fwkacllib/python/site-packages:$PYTHONPATH
|
||||
export ASCEND_OPP_PATH=$ASCEND_HOME/ascend-toolkit/latest/opp
|
||||
else
|
||||
export PATH=$ASCEND_HOME/atc/ccec_compiler/bin:$ASCEND_HOME/atc/bin:$PATH
|
||||
export LD_LIBRARY_PATH=/usr/local/lib:$ASCEND_HOME/atc/lib64:$ASCEND_HOME/acllib/lib64:$ASCEND_HOME/driver/lib64:$ASCEND_HOME/add-ones:$LD_LIBRARY_PATH
|
||||
export LD_LIBRARY_PATH=/usr/local/lib:$ASCEND_HOME/atc/lib64:$ASCEND_HOME/acllib/lib64:$ASCEND_HOME/driver/lib64:$ASCEND_HOME/add-ons:$LD_LIBRARY_PATH
|
||||
export PYTHONPATH=$ASCEND_HOME/atc/python/site-packages:$PYTHONPATH
|
||||
export ASCEND_OPP_PATH=$ASCEND_HOME/opp
|
||||
fi
|
||||
|
||||
function air_to_om()
|
||||
{
|
||||
atc --input_format=NCHW --framework=1 --model=$model --input_shape="x:1, 3, 768, 1280; im_info: 1, 4" --output=maskrcnn --insert_op_conf=../src/aipp.cfg --precision_mode=allow_fp32_to_fp16 --soc_version=Ascend310 &>atc.log
|
||||
}
|
||||
|
||||
function compile_app()
|
||||
{
|
||||
cd ../ascend310_infer/src || exit
|
||||
sh build.sh &> build.log
|
||||
cd ../ascend310_infer || exit
|
||||
bash build.sh &> build.log
|
||||
cd - || exit
|
||||
}
|
||||
|
||||
|
@ -76,24 +67,19 @@ function infer()
|
|||
if [ -d result_Files ]; then
|
||||
rm -rf ./result_Files
|
||||
fi
|
||||
if [ -d time_Result ]; then
|
||||
if [ -d time_Result ]; then
|
||||
rm -rf ./time_Result
|
||||
fi
|
||||
mkdir result_Files
|
||||
mkdir time_Result
|
||||
../ascend310_infer/src/out/main --om_path=./maskrcnn.om --data_path=$data_path --device_id=$device_id &> infer.log
|
||||
../ascend310_infer/out/main --mindir_path=$model --dataset_path=$data_path --device_id=$device_id &> infer.log
|
||||
}
|
||||
|
||||
function cal_acc()
|
||||
{
|
||||
python ../postprocess.py --ann_file=$ann_file --img_path=$data_path &> acc.log &
|
||||
python3.7 ../postprocess.py --ann_file=$ann_file --img_path=$data_path --result_path=./result_Files &> acc.log &
|
||||
}
|
||||
|
||||
air_to_om
|
||||
if [ $? -ne 0 ]; then
|
||||
echo "air to om failed"
|
||||
exit 1
|
||||
fi
|
||||
compile_app
|
||||
if [ $? -ne 0 ]; then
|
||||
echo "compile app code failed"
|
||||
|
|
|
@ -1,26 +0,0 @@
|
|||
aipp_op {
|
||||
aipp_mode : static
|
||||
input_format : YUV420SP_U8
|
||||
related_input_rank : 0
|
||||
csc_switch : true
|
||||
rbuv_swap_switch : false
|
||||
matrix_r0c0 : 256
|
||||
matrix_r0c1 : 0
|
||||
matrix_r0c2 : 359
|
||||
matrix_r1c0 : 256
|
||||
matrix_r1c1 : -88
|
||||
matrix_r1c2 : -183
|
||||
matrix_r2c0 : 256
|
||||
matrix_r2c1 : 454
|
||||
matrix_r2c2 : 0
|
||||
input_bias_0 : 0
|
||||
input_bias_1 : 128
|
||||
input_bias_2 : 128
|
||||
|
||||
mean_chn_0 : 124
|
||||
mean_chn_1 : 117
|
||||
mean_chn_2 : 104
|
||||
var_reci_chn_0 : 0.0171247538316637
|
||||
var_reci_chn_1 : 0.0175070028011204
|
||||
var_reci_chn_2 : 0.0174291938997821
|
||||
}
|
Loading…
Reference in New Issue