// Tencent is pleased to support the open source community by making ncnn available. // // Copyright (C) 2021 THL A29 Limited, a Tencent company. All rights reserved. // // Licensed under the BSD 3-Clause License (the "License"); you may not use this file except // in compliance with the License. You may obtain a copy of the License at // // https://opensource.org/licenses/BSD-3-Clause // // Unless required by applicable law or agreed to in writing, software distributed // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR // CONDITIONS OF ANY KIND, either express or implied. See the License for the // specific language governing permissions and limitations under the License. #include "command.h" #include "gpu.h" #include "mat.h" #include "testutil.h" static int test_command_upload_download(const ncnn::Mat& a) { ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device(); ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator(); ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator(); ncnn::Option opt; opt.num_threads = 1; opt.use_vulkan_compute = true; opt.blob_vkallocator = blob_allocator; opt.staging_vkallocator = staging_allocator; if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false; if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false; ncnn::Mat d; ncnn::Mat e; { ncnn::VkCompute cmd(vkdev); ncnn::VkMat b1; ncnn::VkImageMat b2; ncnn::VkImageMat c1; ncnn::VkMat c2; cmd.record_upload(a, b1, opt); cmd.record_upload(a, c1, opt); cmd.record_buffer_to_image(b1, b2, opt); cmd.record_image_to_buffer(c1, c2, opt); cmd.record_download(b2, d, opt); cmd.record_download(c2, e, opt); cmd.submit_and_wait(); } vkdev->reclaim_blob_allocator(blob_allocator); vkdev->reclaim_staging_allocator(staging_allocator); if (CompareMat(a, d, 0.001) != 0) { fprintf(stderr, "test_command_upload_download buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c); return -1; } if (CompareMat(a, e, 0.001) != 0) { fprintf(stderr, "test_command_upload_download image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c); return -1; } return 0; } static int test_command_clone(const ncnn::Mat& a) { ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device(); ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator(); ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator(); ncnn::Option opt; opt.num_threads = 1; opt.use_vulkan_compute = true; opt.blob_vkallocator = blob_allocator; opt.staging_vkallocator = staging_allocator; if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false; if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false; ncnn::Mat d; ncnn::Mat e; { ncnn::VkCompute cmd(vkdev); ncnn::VkMat b1; ncnn::VkMat b2; ncnn::VkImageMat b3; ncnn::VkImageMat c1; ncnn::VkImageMat c2; ncnn::VkMat c3; cmd.record_clone(a, b1, opt); cmd.record_clone(a, c1, opt); cmd.record_clone(b1, b2, opt); cmd.record_clone(c1, c2, opt); cmd.record_clone(b2, b3, opt); cmd.record_clone(c2, c3, opt); cmd.record_clone(b3, d, opt); cmd.record_clone(c3, e, opt); cmd.submit_and_wait(); } vkdev->reclaim_blob_allocator(blob_allocator); vkdev->reclaim_staging_allocator(staging_allocator); if (CompareMat(a, d, 0.001) != 0) { fprintf(stderr, "test_command_clone buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c); return -1; } if (CompareMat(a, e, 0.001) != 0) { fprintf(stderr, "test_command_clone image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c); return -1; } return 0; } static int test_command_transfer(const ncnn::Mat& a) { ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device(); ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator(); ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator(); ncnn::Option opt; opt.num_threads = 1; opt.use_vulkan_compute = true; opt.blob_vkallocator = blob_allocator; opt.staging_vkallocator = staging_allocator; if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false; if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false; ncnn::Mat d; ncnn::Mat e; { ncnn::VkTransfer cmd1(vkdev); ncnn::VkMat b1; ncnn::VkImageMat c1; cmd1.record_upload(a, b1, opt, false); cmd1.record_upload(a, c1, opt); cmd1.submit_and_wait(); ncnn::VkCompute cmd2(vkdev); cmd2.record_download(b1, d, opt); cmd2.record_download(c1, e, opt); cmd2.submit_and_wait(); } vkdev->reclaim_blob_allocator(blob_allocator); vkdev->reclaim_staging_allocator(staging_allocator); if (CompareMat(a, d, 0.001) != 0) { fprintf(stderr, "test_command_transfer buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c); return -1; } if (CompareMat(a, e, 0.001) != 0) { fprintf(stderr, "test_command_transfer image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c); return -1; } return 0; } static int test_command_0() { return 0 || test_command_upload_download(RandomMat(5, 7, 24)) || test_command_upload_download(RandomMat(7, 9, 12)) || test_command_upload_download(RandomMat(3, 5, 13)) || test_command_upload_download(RandomMat(15, 24)) || test_command_upload_download(RandomMat(19, 12)) || test_command_upload_download(RandomMat(17, 15)) || test_command_upload_download(RandomMat(128)) || test_command_upload_download(RandomMat(124)) || test_command_upload_download(RandomMat(127)); } static int test_command_1() { return 0 || test_command_clone(RandomMat(5, 7, 24)) || test_command_clone(RandomMat(7, 9, 12)) || test_command_clone(RandomMat(3, 5, 13)) || test_command_clone(RandomMat(15, 24)) || test_command_clone(RandomMat(19, 12)) || test_command_clone(RandomMat(17, 15)) || test_command_clone(RandomMat(128)) || test_command_clone(RandomMat(124)) || test_command_clone(RandomMat(127)); } static int test_command_2() { return 0 || test_command_transfer(RandomMat(5, 7, 24)) || test_command_transfer(RandomMat(7, 9, 12)) || test_command_transfer(RandomMat(3, 5, 13)) || test_command_transfer(RandomMat(15, 24)) || test_command_transfer(RandomMat(19, 12)) || test_command_transfer(RandomMat(17, 15)) || test_command_transfer(RandomMat(128)) || test_command_transfer(RandomMat(124)) || test_command_transfer(RandomMat(127)); } int main() { SRAND(7767517); return test_command_0() || test_command_1() || test_command_2(); }