58 Star 283 Fork 3

腾讯开源/ncnn

加入 Gitee
与超过 1200万 开发者一起发现、参与优秀开源项目,私有仓库也完全免费 :)
免费加入
文件
克隆/下载
test_command.cpp 5.71 KB
一键复制 编辑 原始数据 按行查看 历史
// Copyright 2021 Tencent
// SPDX-License-Identifier: BSD-3-Clause
#include "command.h"
#include "gpu.h"
#include "mat.h"
#include "testutil.h"
// Uploads a host Mat into a VkMat and downloads it again within a single
// VkCompute command, then compares the downloaded data with the input.
//
// a: host matrix used as the upload source and as the comparison reference.
//
// Returns 0 when CompareMat(a, c, 0.001) reports no difference, and -1 when it
// reports a difference or when no Vulkan device could be obtained.
static int test_command_upload_download(const ncnn::Mat& a)
{
    ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
    if (!vkdev)
    {
        // Every statement below dereferences vkdev; fail cleanly instead of crashing.
        fprintf(stderr, "test_command_upload_download failed to get vulkan device\n");
        return -1;
    }

    ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
    ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();

    ncnn::Option opt;
    opt.num_threads = 1;
    opt.use_vulkan_compute = true;
    opt.blob_vkallocator = blob_allocator;
    opt.staging_vkallocator = staging_allocator;

    // Switch off fp16 options that the device reports as unsupported.
    if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
    if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;

    ncnn::Mat c;
    {
        // Inner scope: cmd and b go out of scope before the allocators are reclaimed.
        ncnn::VkCompute cmd(vkdev);

        ncnn::VkMat b;
        cmd.record_upload(a, b, opt);
        cmd.record_download(b, c, opt);

        cmd.submit_and_wait();
    }

    vkdev->reclaim_blob_allocator(blob_allocator);
    vkdev->reclaim_staging_allocator(staging_allocator);

    if (CompareMat(a, c, 0.001) != 0)
    {
        // The round trip goes through a VkMat, so label the failure "buffer"
        // like test_command_transfer does for the same storage type.
        fprintf(stderr, "test_command_upload_download buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
        return -1;
    }

    return 0;
}
// Exercises VkCompute::record_clone along two chains recorded in one command
// and compares each chain's final host Mat with the input.
//
//   chain 1: a -> b1 (VkMat)      -> b2 (VkMat)      -> b3 (VkImageMat) -> d
//   chain 2: a -> c1 (VkImageMat) -> c2 (VkImageMat) -> c3 (VkMat)      -> e
//
// a: host matrix used as the source of both chains and as the reference.
//
// Returns 0 when both CompareMat(a, d, 0.001) and CompareMat(a, e, 0.001)
// report no difference, and -1 when either reports a difference or when no
// Vulkan device could be obtained.
static int test_command_clone(const ncnn::Mat& a)
{
    ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
    if (!vkdev)
    {
        // Every statement below dereferences vkdev; fail cleanly instead of crashing.
        fprintf(stderr, "test_command_clone failed to get vulkan device\n");
        return -1;
    }

    ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
    ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();

    ncnn::Option opt;
    opt.num_threads = 1;
    opt.use_vulkan_compute = true;
    opt.blob_vkallocator = blob_allocator;
    opt.staging_vkallocator = staging_allocator;

    // Switch off fp16 options that the device reports as unsupported.
    if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
    if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;

    ncnn::Mat d;
    ncnn::Mat e;
    {
        // Inner scope: cmd and the intermediate mats go out of scope before
        // the allocators are reclaimed.
        ncnn::VkCompute cmd(vkdev);

        ncnn::VkMat b1;
        ncnn::VkMat b2;
        ncnn::VkImageMat b3;
        ncnn::VkImageMat c1;
        ncnn::VkImageMat c2;
        ncnn::VkMat c3;

        // The two chains are recorded interleaved, one step of each at a time.
        cmd.record_clone(a, b1, opt);
        cmd.record_clone(a, c1, opt);
        cmd.record_clone(b1, b2, opt);
        cmd.record_clone(c1, c2, opt);
        cmd.record_clone(b2, b3, opt);
        cmd.record_clone(c2, c3, opt);
        cmd.record_clone(b3, d, opt);
        cmd.record_clone(c3, e, opt);

        cmd.submit_and_wait();
    }

    vkdev->reclaim_blob_allocator(blob_allocator);
    vkdev->reclaim_staging_allocator(staging_allocator);

    // d is the end of the chain that starts with a VkMat.
    if (CompareMat(a, d, 0.001) != 0)
    {
        fprintf(stderr, "test_command_clone buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
        return -1;
    }

    // e is the end of the chain that starts with a VkImageMat.
    if (CompareMat(a, e, 0.001) != 0)
    {
        fprintf(stderr, "test_command_clone image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
        return -1;
    }

    return 0;
}
// Uploads a host Mat into a VkMat with a VkTransfer command, downloads it with
// a separate VkCompute command, and compares the result with the input.
//
// a: host matrix used as the upload source and as the comparison reference.
//
// Returns 0 when CompareMat(a, c, 0.001) reports no difference, and -1 when it
// reports a difference or when no Vulkan device could be obtained.
static int test_command_transfer(const ncnn::Mat& a)
{
    ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
    if (!vkdev)
    {
        // Every statement below dereferences vkdev; fail cleanly instead of crashing.
        fprintf(stderr, "test_command_transfer failed to get vulkan device\n");
        return -1;
    }

    ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
    ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();

    ncnn::Option opt;
    opt.num_threads = 1;
    opt.use_vulkan_compute = true;
    opt.blob_vkallocator = blob_allocator;
    opt.staging_vkallocator = staging_allocator;

    // Switch off fp16 options that the device reports as unsupported.
    if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
    if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;

    ncnn::Mat c;
    {
        // Inner scope: both commands and b go out of scope before the
        // allocators are reclaimed.
        ncnn::VkTransfer cmd1(vkdev);

        ncnn::VkMat b;
        // The trailing false is the fourth record_upload argument;
        // NOTE(review): presumably the "flatten" switch - confirm against command.h.
        cmd1.record_upload(a, b, opt, false);

        // The upload is submitted and waited on before the download is recorded.
        cmd1.submit_and_wait();

        ncnn::VkCompute cmd2(vkdev);

        cmd2.record_download(b, c, opt);

        cmd2.submit_and_wait();
    }

    vkdev->reclaim_blob_allocator(blob_allocator);
    vkdev->reclaim_staging_allocator(staging_allocator);

    if (CompareMat(a, c, 0.001) != 0)
    {
        fprintf(stderr, "test_command_transfer buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
        return -1;
    }

    return 0;
}
// Runs test_command_upload_download over a fixed list of random matrices
// (three 3-argument, three 2-argument and three 1-argument RandomMat shapes).
// Stops at the first case that returns non-zero and returns 1; returns 0 when
// every case returns 0.
static int test_command_0()
{
    // 3-argument shapes
    if (test_command_upload_download(RandomMat(5, 7, 24))) return 1;
    if (test_command_upload_download(RandomMat(7, 9, 12))) return 1;
    if (test_command_upload_download(RandomMat(3, 5, 13))) return 1;

    // 2-argument shapes
    if (test_command_upload_download(RandomMat(15, 24))) return 1;
    if (test_command_upload_download(RandomMat(19, 12))) return 1;
    if (test_command_upload_download(RandomMat(17, 15))) return 1;

    // 1-argument shapes
    if (test_command_upload_download(RandomMat(128))) return 1;
    if (test_command_upload_download(RandomMat(124))) return 1;
    if (test_command_upload_download(RandomMat(127))) return 1;

    return 0;
}
// Runs test_command_clone over a fixed list of random matrices
// (three 3-argument, three 2-argument and three 1-argument RandomMat shapes).
// Stops at the first case that returns non-zero and returns 1; returns 0 when
// every case returns 0.
static int test_command_1()
{
    // 3-argument shapes
    if (test_command_clone(RandomMat(5, 7, 24))) return 1;
    if (test_command_clone(RandomMat(7, 9, 12))) return 1;
    if (test_command_clone(RandomMat(3, 5, 13))) return 1;

    // 2-argument shapes
    if (test_command_clone(RandomMat(15, 24))) return 1;
    if (test_command_clone(RandomMat(19, 12))) return 1;
    if (test_command_clone(RandomMat(17, 15))) return 1;

    // 1-argument shapes
    if (test_command_clone(RandomMat(128))) return 1;
    if (test_command_clone(RandomMat(124))) return 1;
    if (test_command_clone(RandomMat(127))) return 1;

    return 0;
}
// Runs test_command_transfer over a fixed list of random matrices
// (three 3-argument, three 2-argument and three 1-argument RandomMat shapes).
// Stops at the first case that returns non-zero and returns 1; returns 0 when
// every case returns 0.
static int test_command_2()
{
    // 3-argument shapes
    if (test_command_transfer(RandomMat(5, 7, 24))) return 1;
    if (test_command_transfer(RandomMat(7, 9, 12))) return 1;
    if (test_command_transfer(RandomMat(3, 5, 13))) return 1;

    // 2-argument shapes
    if (test_command_transfer(RandomMat(15, 24))) return 1;
    if (test_command_transfer(RandomMat(19, 12))) return 1;
    if (test_command_transfer(RandomMat(17, 15))) return 1;

    // 1-argument shapes
    if (test_command_transfer(RandomMat(128))) return 1;
    if (test_command_transfer(RandomMat(124))) return 1;
    if (test_command_transfer(RandomMat(127))) return 1;

    return 0;
}
// Test entry point: seeds the random generator with a fixed value, then runs
// the three test groups in order, stopping at the first group that returns
// non-zero. The exit status is 1 in that case and 0 when all groups return 0.
int main()
{
    SRAND(7767517);

    if (test_command_0()) return 1;
    if (test_command_1()) return 1;
    if (test_command_2()) return 1;

    return 0;
}
Loading...
马建仓 AI 助手
尝试更多
代码解读
代码找茬
代码优化
C/C++
1
https://gitee.com/Tencent/ncnn.git
git@gitee.com:Tencent/ncnn.git
Tencent
ncnn
ncnn
master

搜索帮助