海思3559a從零開始做計算機視覺4

第四天

準備先將海思給的SSD的nnie的例子跑起來


SSD是原版的vgg16作爲主幹網絡的例子,官方給出的wk文件是已經經過轉化之後的

但是給的例子中讀取圖片是加載的bgr文件,這樣測試起來非常不方便,所以用opencv 重新寫了讀圖片的接口。

	IplImage *imgSrc = 0;
    imgSrc = cvLoadImage(pcSrcFile, 1);
        if (imgSrc == 0) {
        printf("Load image error\n");
        return -1;
    }
    //--resize to 300*300
    IplImage *img;
    CvSize dstSize;
    dstSize.height = 300;
    dstSize.width = 300;
    img = cvCreateImage(dstSize,imgSrc->depth,imgSrc->nChannels);
    cvResize(imgSrc,img,CV_INTER_CUBIC);

    HI_U8 *data = (HI_U8*)img->imageData;
    int step = img->widthStep;
    int h = img->height;
    int w = img->width;
    int c = img->nChannels;

    IplImage *bgrImg = 0;
    CvSize sz;
    sz.width = w;
    sz.height = h;
    bgrImg = cvCreateImage(sz,img->depth,img->nChannels);
    HI_U8* bgr = (HI_U8*)bgrImg->imageData;
    int offset = 0;
        //注意遍歷順序
    for (int k=0; k<c; k++) {
        for (int i=0; i<h; i++) {
            for(int j=0; j<w; j++) {
                bgr[offset] = data[i*step + j*c + k];
                offset++;
            }
        }
    }

這樣將jpg圖片轉爲了bgr格式圖片,然後將SAMPLE_SVP_NNIE_FillSrcData函數改寫了

static HI_S32 SAMPLE_SVP_NNIE_FillSrcDataFromFrame(HI_U8* pImage,
    SAMPLE_SVP_NNIE_PARAM_S *pstNnieParam, SAMPLE_SVP_NNIE_INPUT_DATA_INDEX_S* pstInputDataIdx)
{
    HI_U32 i =0, j = 0, n = 0;
    HI_U32 u32Height = 0, u32Width = 0, u32Chn = 0, u32Stride = 0, u32Dim = 0;
    HI_U32 u32VarSize = 0;
    HI_S32 s32Ret = HI_SUCCESS;
    HI_U8*pu8PicAddr = NULL;
    HI_U32*pu32StepAddr = NULL;
    HI_U32 u32SegIdx = pstInputDataIdx->u32SegIdx;
    HI_U32 u32NodeIdx = pstInputDataIdx->u32NodeIdx;
    HI_U32 u32TotalStepNum = 0;
	HI_U32 u32SrcPerLine = 0;

	if(NULL == pImage)
	{
		SAMPLE_SVP_CHECK_EXPR_GOTO(1 != s32Ret,FAIL,SAMPLE_SVP_ERR_LEVEL_ERROR,"Error, input image is NULL!\n");
	}

    /*get data size*/
    if(SVP_BLOB_TYPE_U8 <= pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].enType &&
        SVP_BLOB_TYPE_YVU422SP >= pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].enType)
    {
        u32VarSize = sizeof(HI_U8);
    }
    else
    {
        u32VarSize = sizeof(HI_U32);
    }

    /*fill src data*/
    if(SVP_BLOB_TYPE_SEQ_S32 == pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].enType)
    {
        u32Dim = pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].unShape.stSeq.u32Dim;
        u32Stride = pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].u32Stride;
        pu32StepAddr = (HI_U32*)(pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].unShape.stSeq.u64VirAddrStep);
        pu8PicAddr = (HI_U8*)(pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].u64VirAddr);

		u32SrcPerLine = u32Dim*u32VarSize;
		
        for(n = 0; n < pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].u32Num; n++)
        {
            for(i = 0;i < *(pu32StepAddr+n); i++)
            {
                //s32Ret = fread(pu8PicAddr,u32Dim*u32VarSize,1,fp);
                memcpy(pu8PicAddr,pImage,u32SrcPerLine);
                printf("mem copy\n");
				pImage += u32SrcPerLine;
                pu8PicAddr += u32Stride;
            }
            u32TotalStepNum += *(pu32StepAddr+n);
        }
        SAMPLE_COMM_SVP_FlushCache(pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].u64PhyAddr,
            (HI_VOID *) pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].u64VirAddr,
            u32TotalStepNum*u32Stride);
    }
    else
    {
        u32Height = pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].unShape.stWhc.u32Height;
        u32Width = pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].unShape.stWhc.u32Width;
        u32Chn = pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].unShape.stWhc.u32Chn;
        u32Stride = pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].u32Stride;
        pu8PicAddr = (HI_U8*)(pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].u64VirAddr);

		u32SrcPerLine = u32Width*u32VarSize;
        for(n = 0; n < pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].u32Num; n++)
        {
            for(i = 0;i < u32Chn; i++)
            {
                for(j = 0; j < u32Height; j++)
                {
                    //s32Ret = fread(pu8PicAddr,u32Width*u32VarSize,1,fp);
					memcpy(pu8PicAddr,pImage,u32SrcPerLine);
					pImage += u32SrcPerLine;
                    pu8PicAddr += u32Stride;
                }
            }
        }		
		
        SAMPLE_COMM_SVP_FlushCache(pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].u64PhyAddr,
            (HI_VOID *) pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].u64VirAddr,
            pstNnieParam->astSegData[u32SegIdx].astSrc[u32NodeIdx].u32Num*u32Chn*u32Height*u32Stride);
    }


    return HI_SUCCESS;
	
FAIL:
    return HI_FAILURE;
    
}

這樣就可以直接使用opencv讀圖片了。

sample中SSD的例子,在nnie下運行時間不太穩定,也不太快,根本沒法達到要求

所以接下來的事情就是自己訓練一個小網絡,轉nnie模型,爭取達到200fps。


關注我的公衆號,分享資源
公衆號搜索: 卡本特
掃碼關注
在這裏插入圖片描述

發表評論
所有評論
還沒有人評論,想成為第一個評論的人麼? 請在上方評論欄輸入並且點擊發布.
相關文章