CL/UNIT/Multithreaded.cpp

/*
 * Copyright (c) 2022 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
#include "arm_compute/runtime/CL/functions/CLActivationLayer.h"
#include "arm_compute/runtime/CL/functions/CLPixelWiseMultiplication.h"
#include "arm_compute/runtime/RuntimeContext.h"

#include "tests/CL/CLAccessor.h"
#include "tests/framework/Macros.h"
#include "tests/framework/ParametersLibrary.h"
#include "tests/validation/Validation.h"
#include "tests/validation/reference/ActivationLayer.h"
#include "tests/validation/reference/PixelWiseMultiplication.h"

#include <array>
#include <exception>
#include <thread>

*c217d954SCole Faustnamespace arm_compute
*c217d954SCole Faust{
*c217d954SCole Faustnamespace test
*c217d954SCole Faust{
*c217d954SCole Faustnamespace validation
*c217d954SCole Faust{
*c217d954SCole FaustTEST_SUITE(CL)
*c217d954SCole FaustTEST_SUITE(UNIT)
*c217d954SCole FaustTEST_SUITE(RuntimeContext)
*c217d954SCole Faust// This test tries scheduling work concurrently from two independent threads
*c217d954SCole FaustTEST_CASE(MultipleThreadedScheduller, framework::DatasetMode::ALL)
*c217d954SCole Faust{
*c217d954SCole Faust    constexpr auto num_threads(16u);
*c217d954SCole Faust    std::array<CLActivationLayer, num_threads>         func{};
*c217d954SCole Faust    std::array<CLPixelWiseMultiplication, num_threads> pmul{};
*c217d954SCole Faust    std::array<CLTensor, num_threads>                  s0{};
*c217d954SCole Faust    std::array<CLTensor, num_threads>                  s1{};
*c217d954SCole Faust
*c217d954SCole Faust    std::array<CLTensor, num_threads> st{};
*c217d954SCole Faust    std::array<CLTensor, num_threads> dt{};
*c217d954SCole Faust
*c217d954SCole Faust    const TensorShape         tensor_shape(128u, 4u, 5u);
*c217d954SCole Faust    const ActivationLayerInfo ainfo(ActivationLayerInfo::ActivationFunction::LOGISTIC, 0.5f, 1.f);
*c217d954SCole Faust    std::array<std::thread, num_threads> threads;
*c217d954SCole Faust    auto ctx = parameters->get_ctx<CLTensor>();
*c217d954SCole Faust
*c217d954SCole Faust    for(auto i = 0u; i < num_threads; ++i)
*c217d954SCole Faust    {
*c217d954SCole Faust        s0[i]   = create_tensor<CLTensor>(tensor_shape, DataType::F32, 1);
*c217d954SCole Faust        s1[i]   = create_tensor<CLTensor>(tensor_shape, DataType::F32, 1);
*c217d954SCole Faust        st[i]   = create_tensor<CLTensor>(tensor_shape, DataType::F32, 1);
*c217d954SCole Faust        dt[i]   = create_tensor<CLTensor>(tensor_shape, DataType::F32, 1);
*c217d954SCole Faust        func[i] = CLActivationLayer(ctx);
*c217d954SCole Faust        pmul[i] = CLPixelWiseMultiplication();
*c217d954SCole Faust        threads[i] =
*c217d954SCole Faust            std::thread([&,i]
*c217d954SCole Faust        {
*c217d954SCole Faust            auto &s  = st[i];
*c217d954SCole Faust            auto &t  = dt[i];
*c217d954SCole Faust            auto &p0 = s0[i];
*c217d954SCole Faust            auto &p1 = s1[i];
*c217d954SCole Faust            pmul[i].configure(&p0, &p1, &s, 1.f, ConvertPolicy::WRAP, RoundingPolicy::TO_NEAREST_UP);
*c217d954SCole Faust            func[i].configure(&s, &t, ainfo);
*c217d954SCole Faust            s.allocator()->allocate();
*c217d954SCole Faust            t.allocator()->allocate();
*c217d954SCole Faust            p0.allocator()->allocate();
*c217d954SCole Faust            p1.allocator()->allocate();
*c217d954SCole Faust            library->fill_tensor_uniform(CLAccessor(p0), 0, -1.f, 1.f);
*c217d954SCole Faust            library->fill_tensor_uniform(CLAccessor(p1), 0, -1.f, 1.f);
*c217d954SCole Faust            pmul[i].run();
*c217d954SCole Faust            func[i].run();
*c217d954SCole Faust        });
*c217d954SCole Faust    }
*c217d954SCole Faust
*c217d954SCole Faust    for(auto &t : threads)
*c217d954SCole Faust    {
*c217d954SCole Faust        t.join();
*c217d954SCole Faust    }
*c217d954SCole Faust
*c217d954SCole Faust    SimpleTensor<float> rs{ tensor_shape, DataType::F32, 1 };
*c217d954SCole Faust    SimpleTensor<float> ra{ tensor_shape, DataType::F32, 1 };
*c217d954SCole Faust    SimpleTensor<float> rb{ tensor_shape, DataType::F32, 1 };
*c217d954SCole Faust    library->fill_tensor_uniform(ra, 0, -1.f, 1.f);
*c217d954SCole Faust    library->fill_tensor_uniform(rb, 0, -1.f, 1.f);
*c217d954SCole Faust    const auto mul    = reference::pixel_wise_multiplication<float, float, float>(ra, rb, 1.f, ConvertPolicy::WRAP, RoundingPolicy::TO_NEAREST_UP, DataType::F32);
*c217d954SCole Faust    const auto golden = reference::activation_layer<float>(mul, ainfo);
*c217d954SCole Faust    for(auto &d : dt)
*c217d954SCole Faust    {
*c217d954SCole Faust        validate(CLAccessor(d), golden);
*c217d954SCole Faust    }
*c217d954SCole Faust}
*c217d954SCole Faust
*c217d954SCole FaustTEST_SUITE_END() // MultipleThreadedScheduller
*c217d954SCole FaustTEST_SUITE_END() // UNIT
*c217d954SCole FaustTEST_SUITE_END() // CL
*c217d954SCole Faust} // namespace validation
*c217d954SCole Faust} // namespace test
*c217d954SCole Faust} // namespace arm_compute