/*******************************************************************************
 *
 * MIT License
 *
 * Copyright (c) 2018 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 *******************************************************************************/
#include "test.hpp"
// NOTE(review): the angle-bracket header names (and every template argument
// list in this file) were missing from the reviewed text. They have been
// reconstructed from how the code uses them -- confirm against the build.
#include <array>
#include <iostream>
#include <iterator>
#include <limits>
#include <memory>
#include <miopen/convolution.hpp>
#include <miopen/miopen.h>
#include <miopen/tensor.hpp>
#include <miopen/tensor_ops.hpp>
#include <utility>
#include <cstddef>
#include <cstdlib>
#include <cmath>
#include <vector>

#include "driver.hpp"
#include "get_handle.hpp"
#include "tensor_holder.hpp"
#include "verify.hpp"

/// Verifier comparing a host-side reference cast against miopen::CastTensor.
///
/// The source and destination are "super" tensors; `srcDesc` / `dstDesc`
/// describe the strided sub-tensor views that are actually cast, starting at
/// `srcOffset` / `dstOffset` elements into the respective super-tensor.
///
/// @tparam T element type of the destination tensor.
template <class T>
struct verify_tensor_cast
{
    miopen::TensorDescriptor srcDesc;
    miopen::TensorDescriptor dstDesc;
    tensor<int> srcSuper; // NOTE(review): element type inferred from the miopenInt32 source descriptor
    tensor<T> dstSuper;
    int srcOffset;
    int dstOffset;
    float alpha;
    float max_val;

    /// @param psrc_super source super-tensor (copied).
    /// @param pdst_super destination super-tensor (copied).
    /// @param psd        descriptor of the source sub-tensor view.
    /// @param pdd        descriptor of the destination sub-tensor view.
    /// @param offsets    {source offset, destination offset}; must hold at
    ///                   least two entries.
    /// @param palpha     scale applied to each source element before casting.
    /// @param pmax_val   upper clamp applied to the scaled value.
    /// @throws std::out_of_range if `offsets` has fewer than two entries
    ///         (previously an unchecked out-of-bounds read).
    verify_tensor_cast(const tensor<int>& psrc_super,
                       const tensor<T>& pdst_super,
                       const miopen::TensorDescriptor& psd,
                       const miopen::TensorDescriptor& pdd,
                       std::vector<int> offsets,
                       const float palpha,
                       const float pmax_val)
        : srcDesc(psd),
          dstDesc(pdd),
          srcSuper(psrc_super),
          dstSuper(pdst_super),
          srcOffset(offsets.at(0)),
          dstOffset(offsets.at(1)),
          alpha(palpha),
          max_val(pmax_val)
    {
    }

    /// Recursively walks dimension `dim` of the sub-tensor view and, at the
    /// innermost dimension, writes `T(min(src * alpha, max_val))` into
    /// `dstSuperCpu`.
    ///
    /// @param dstSuperCpu      destination super-tensor updated in place.
    /// @param src_offset_index element offset accumulated from outer dims (source).
    /// @param dst_offset_index element offset accumulated from outer dims (destination).
    /// @param dim              dimension handled by this call; start with 0.
    void tensor_cast_for_loop(tensor<T>& dstSuperCpu,
                              std::size_t src_offset_index,
                              std::size_t dst_offset_index,
                              std::size_t dim) const
    {
        const auto& lengths   = srcDesc.GetLengths();
        const auto src_stride = srcDesc.GetStrides()[dim];
        const auto dst_stride = dstDesc.GetStrides()[dim];

        // The view's base offset is applied exactly once, at the outermost level.
        const std::size_t src_base =
            ((dim == 0) ? static_cast<std::size_t>(srcOffset) : 0) + src_offset_index;
        const std::size_t dst_base =
            ((dim == 0) ? static_cast<std::size_t>(dstOffset) : 0) + dst_offset_index;

        // Written as `dim + 1 < rank` so that a rank of 0 cannot underflow.
        const bool has_inner_dim = (dim + 1 < lengths.size());

        for(std::size_t idx = 0; idx < lengths[dim]; ++idx)
        {
            const std::size_t src_super_index = src_base + src_stride * idx;
            const std::size_t dst_super_index = dst_base + dst_stride * idx;

            if(has_inner_dim)
            {
                // The inner levels visit every element below this index,
                // including the one at (idx, 0, ..., 0), so no store is needed
                // here; storing at this level would only repeat that write.
                tensor_cast_for_loop(dstSuperCpu, src_super_index, dst_super_index, dim + 1);
                continue;
            }

            // Elements falling outside either super-tensor are skipped.
            if(dst_super_index < dstSuperCpu.desc.GetElementSpace() &&
               src_super_index < srcSuper.desc.GetElementSpace())
            {
                const float scaled = static_cast<float>(srcSuper[src_super_index]) * alpha;
                dstSuperCpu[dst_super_index] = T(scaled >= max_val ? max_val : scaled);
            }
        }
    }

    /// Host reference: a copy of the destination super-tensor with the
    /// sub-tensor region overwritten by the scaled, clamped source values.
    tensor<T> cpu() const
    {
        tensor<T> dstSuperCpu = dstSuper;
        tensor_cast_for_loop(dstSuperCpu, 0, 0, 0);
        return dstSuperCpu;
    }

    /// Device result: uploads both super-tensors, runs miopen::CastTensor with
    /// the sub-tensor descriptors and offsets, and reads the destination back.
    tensor<T> gpu() const
    {
        tensor<T> dstSuperGpu = dstSuper;

        auto&& handle     = get_handle();
        auto dstSuper_dev = handle.Write(dstSuperGpu.data);
        auto srcSuper_dev = handle.Write(srcSuper.data);

        miopen::CastTensor(handle,
                           &alpha,
                           srcDesc,
                           srcSuper_dev.get(),
                           dstDesc,
                           dstSuper_dev.get(),
                           srcOffset,
                           dstOffset);

        dstSuperGpu.data = handle.Read<T>(dstSuper_dev, dstSuperGpu.data.size());

        return dstSuperGpu;
    }

    /// Prints the tensor configuration of the case being verified.
    void fail(float = 0) const
    {
        std::cout << "Tensor Cast: " << '\n';
        std::cout << "src super-tensor: " << srcSuper.desc.ToString() << '\n';
        std::cout << "dst super-tensor: " << dstSuper.desc.ToString() << '\n';
        std::cout << "src sub-tensor: " << srcDesc.ToString() << '\n';
        // Single flush at the end instead of one per line.
        std::cout << "dst sub-tensor: " << dstDesc.ToString() << std::endl;
    }
};

/// Test driver that builds source/destination super-tensors, carves a
/// sub-tensor view of shape `castLens` out of each, and verifies the cast.
///
/// @tparam T element type of the destination tensor.
template <class T>
struct tensor_cast_driver : test_driver
{
    tensor<int> srcSuper;
    tensor<T> dstSuper;
    std::vector<int> srcSuperLens;
    std::vector<int> dstSuperLens;
    float alpha   = 1.0;
    float max_val = 0.;

    miopen::TensorDescriptor srcDesc;
    miopen::TensorDescriptor dstDesc;
    std::vector<int> castLens;
    std::vector<int> offsets;

    /// Registers the driver arguments and their generated/default values.
    tensor_cast_driver()
    {
        disabled_cache            = true;
        std::vector<int> src_lens = {32, 16, 32, 16, 16};
        std::vector<int> dst_lens = {32, 32, 16, 16, 16};

        add(srcSuperLens, "srcSuperLens", generate_data({src_lens}, src_lens));
        add(dstSuperLens, "dstSuperLens", generate_data({dst_lens}, dst_lens));
        add(castLens, "castLens", generate_data(get_sub_tensor(), {32, 8, 10}));
        add(offsets, "offsets", generate_data(get_tensor_offsets(), {7, 11}));
        add(alpha, "alpha", generate_data({1.0 / 127 / 127, 1.0 / 127, 127.0, 1.0}));
    }

    /// Builds the tensors and descriptors for the current arguments and runs
    /// the CPU/GPU comparison.
    void run()
    {
        // Bound handed to the integer element generator; smaller for half.
        unsigned long max_value = miopen_type<T>{} == miopenHalf ? 5 : 32767;

        // Clamp ceiling selected by destination type: 65504 (half),
        // 127 (int8), 2147483647 (int32), otherwise 3.402823466e+38F.
        max_val = miopen_type<T>{} == miopenHalf
                      ? 65504.0
                      : miopen_type<T>{} == miopenInt8
                            ? 127.0
                            : miopen_type<T>{} == miopenInt32 ? 2147483647.0
                                                              : 3.402823466e+38F;

        srcSuper = tensor<int>{srcSuperLens}.generate(tensor_elem_gen_integer{max_value});
        dstSuper = tensor<T>{dstSuperLens}.generate(tensor_elem_gen_integer{max_value});

        const auto& srcSuperStrides = srcSuper.desc.GetStrides();
        const auto& dstSuperStrides = dstSuper.desc.GetStrides();

        // The sub-tensor borrows the trailing strides of each super-tensor, so
        // it cannot have more dimensions than either of them; two offsets are
        // required as well. Such argument combinations are skipped instead of
        // producing an out-of-range iterator / index below.
        if(castLens.empty() || castLens.size() > srcSuperStrides.size() ||
           castLens.size() > dstSuperStrides.size() || offsets.size() < 2)
        {
            return;
        }

        std::vector<int> src_super_strides(srcSuperStrides.begin() +
                                               (srcSuper.desc.GetSize() - castLens.size()),
                                           srcSuperStrides.end());
        std::vector<int> dst_super_strides(dstSuperStrides.begin() +
                                               (dstSuper.desc.GetSize() - castLens.size()),
                                           dstSuperStrides.end());

        srcDesc = miopen::TensorDescriptor(
            miopenInt32, castLens.data(), src_super_strides.data(), castLens.size());
        dstDesc = miopen::TensorDescriptor(
            miopen_type<T>{}, castLens.data(), dst_super_strides.data(), castLens.size());

        if(srcDesc.GetLengths().size() == dstDesc.GetLengths().size())
        {
            verify_equals(verify_tensor_cast<T>{
                srcSuper, dstSuper, srcDesc, dstDesc, offsets, alpha, max_val});
        }
    }
};

int main(int argc, const char* argv[]) { test_drive<tensor_cast_driver>(argc, argv); }