external/android-nn-driver/RequestThread_1_3.cpp

*3e777be0SXin Li//
*3e777be0SXin Li// Copyright © 2020 Arm Ltd and Contributors. All rights reserved.
*3e777be0SXin Li// SPDX-License-Identifier: MIT
*3e777be0SXin Li//
*3e777be0SXin Li
*3e777be0SXin Li#define LOG_TAG "ArmnnDriver"
*3e777be0SXin Li
*3e777be0SXin Li#include "ArmnnPreparedModel_1_3.hpp"
*3e777be0SXin Li#include "RequestThread_1_3.hpp"
*3e777be0SXin Li
*3e777be0SXin Li#include <log/log.h>
*3e777be0SXin Li
*3e777be0SXin Liusing namespace android;
*3e777be0SXin Li
*3e777be0SXin Linamespace armnn_driver
*3e777be0SXin Li{
*3e777be0SXin Li
*3e777be0SXin Litemplate <template <typename HalVersion> class PreparedModel, typename HalVersion, typename CallbackContext>
*3e777be0SXin LiRequestThread_1_3<PreparedModel, HalVersion, CallbackContext>::RequestThread_1_3()
*3e777be0SXin Li{
*3e777be0SXin Li    ALOGV("RequestThread_1_3::RequestThread_1_3()");
*3e777be0SXin Li    m_Thread = std::make_unique<std::thread>(&RequestThread_1_3::Process, this);
*3e777be0SXin Li}
*3e777be0SXin Li
*3e777be0SXin Litemplate <template <typename HalVersion> class PreparedModel, typename HalVersion, typename CallbackContext>
*3e777be0SXin LiRequestThread_1_3<PreparedModel, HalVersion, CallbackContext>::~RequestThread_1_3()
*3e777be0SXin Li{
*3e777be0SXin Li    ALOGV("RequestThread_1_3::~RequestThread_1_3()");
*3e777be0SXin Li
*3e777be0SXin Li    try
*3e777be0SXin Li    {
*3e777be0SXin Li        // Coverity fix: The following code may throw an exception of type std::length_error.
*3e777be0SXin Li
*3e777be0SXin Li        // This code is meant to to terminate the inner thread gracefully by posting an EXIT message
*3e777be0SXin Li        // to the thread's message queue. However, according to Coverity, this code could throw an exception and fail.
*3e777be0SXin Li        // Since only one static instance of RequestThread is used in the driver (in ArmnnPreparedModel),
*3e777be0SXin Li        // this destructor is called only when the application has been closed, which means that
*3e777be0SXin Li        // the inner thread will be terminated anyway, although abruptly, in the event that the destructor code throws.
*3e777be0SXin Li        // Wrapping the destructor's code with a try-catch block simply fixes the Coverity bug.
*3e777be0SXin Li
*3e777be0SXin Li        // Post an EXIT message to the thread
*3e777be0SXin Li        std::shared_ptr<AsyncExecuteData> nulldata(nullptr);
*3e777be0SXin Li        auto pMsg = std::make_shared<ThreadMsg>(ThreadMsgType::EXIT, nulldata);
*3e777be0SXin Li        PostMsg(pMsg);
*3e777be0SXin Li        // Wait for the thread to terminate, it is deleted automatically
*3e777be0SXin Li        m_Thread->join();
*3e777be0SXin Li    }
*3e777be0SXin Li    catch (const std::exception&) { } // Swallow any exception.
*3e777be0SXin Li}
*3e777be0SXin Li
*3e777be0SXin Litemplate <template <typename HalVersion> class PreparedModel, typename HalVersion, typename CallbackContext>
*3e777be0SXin Livoid RequestThread_1_3<PreparedModel, HalVersion, CallbackContext>::PostMsg(PreparedModel<HalVersion>* model,
*3e777be0SXin Li        std::shared_ptr<std::vector<::android::nn::RunTimePoolInfo>>& memPools,
*3e777be0SXin Li        std::shared_ptr<armnn::InputTensors>& inputTensors,
*3e777be0SXin Li        std::shared_ptr<armnn::OutputTensors>& outputTensors,
*3e777be0SXin Li        CallbackContext callbackContext)
*3e777be0SXin Li{
*3e777be0SXin Li    ALOGV("RequestThread_1_3::PostMsg(...)");
*3e777be0SXin Li    auto data = std::make_shared<AsyncExecuteData>(model,
*3e777be0SXin Li                                                   memPools,
*3e777be0SXin Li                                                   inputTensors,
*3e777be0SXin Li                                                   outputTensors,
*3e777be0SXin Li                                                   callbackContext);
*3e777be0SXin Li    auto pMsg = std::make_shared<ThreadMsg>(ThreadMsgType::REQUEST, data);
*3e777be0SXin Li    PostMsg(pMsg, model->GetModelPriority());
*3e777be0SXin Li}
*3e777be0SXin Li
*3e777be0SXin Litemplate <template <typename HalVersion> class PreparedModel, typename HalVersion, typename CallbackContext>
*3e777be0SXin Livoid RequestThread_1_3<PreparedModel, HalVersion, CallbackContext>::PostMsg(std::shared_ptr<ThreadMsg>& pMsg,
*3e777be0SXin Li                                                                        V1_3::Priority priority)
*3e777be0SXin Li{
*3e777be0SXin Li    ALOGV("RequestThread_1_3::PostMsg(pMsg)");
*3e777be0SXin Li    // Add a message to the queue and notify the request thread
*3e777be0SXin Li    std::unique_lock<std::mutex> lock(m_Mutex);
*3e777be0SXin Li    switch (priority) {
*3e777be0SXin Li        case V1_3::Priority::HIGH:
*3e777be0SXin Li            m_HighPriorityQueue.push(pMsg);
*3e777be0SXin Li            break;
*3e777be0SXin Li        case V1_3::Priority::LOW:
*3e777be0SXin Li            m_LowPriorityQueue.push(pMsg);
*3e777be0SXin Li            break;
*3e777be0SXin Li        case V1_3::Priority::MEDIUM:
*3e777be0SXin Li        default:
*3e777be0SXin Li            m_MediumPriorityQueue.push(pMsg);
*3e777be0SXin Li    }
*3e777be0SXin Li    m_Cv.notify_one();
*3e777be0SXin Li}
*3e777be0SXin Li
*3e777be0SXin Litemplate <template <typename HalVersion> class PreparedModel, typename HalVersion, typename CallbackContext>
*3e777be0SXin Livoid RequestThread_1_3<PreparedModel, HalVersion, CallbackContext>::Process()
*3e777be0SXin Li{
*3e777be0SXin Li    ALOGV("RequestThread_1_3::Process()");
*3e777be0SXin Li    int retireRate = RETIRE_RATE;
*3e777be0SXin Li    int highPriorityCount = 0;
*3e777be0SXin Li    int mediumPriorityCount = 0;
*3e777be0SXin Li    while (true)
*3e777be0SXin Li    {
*3e777be0SXin Li        std::shared_ptr<ThreadMsg> pMsg(nullptr);
*3e777be0SXin Li        {
*3e777be0SXin Li            // Wait for a message to be added to the queue
*3e777be0SXin Li            // This is in a separate scope to minimise the lifetime of the lock
*3e777be0SXin Li            std::unique_lock<std::mutex> lock(m_Mutex);
*3e777be0SXin Li            while (m_HighPriorityQueue.empty() && m_MediumPriorityQueue.empty() && m_LowPriorityQueue.empty())
*3e777be0SXin Li            {
*3e777be0SXin Li                m_Cv.wait(lock);
*3e777be0SXin Li            }
*3e777be0SXin Li            // Get the message to process from the front of each queue based on priority from high to low
*3e777be0SXin Li            // Get high priority first if it does not exceed the retire rate
*3e777be0SXin Li            if (!m_HighPriorityQueue.empty() && highPriorityCount < retireRate)
*3e777be0SXin Li            {
*3e777be0SXin Li                pMsg = m_HighPriorityQueue.front();
*3e777be0SXin Li                m_HighPriorityQueue.pop();
*3e777be0SXin Li                highPriorityCount += 1;
*3e777be0SXin Li            }
*3e777be0SXin Li            // If high priority queue is empty or the count exceeds the retire rate, get medium priority message
*3e777be0SXin Li            else if (!m_MediumPriorityQueue.empty() && mediumPriorityCount < retireRate)
*3e777be0SXin Li            {
*3e777be0SXin Li                pMsg = m_MediumPriorityQueue.front();
*3e777be0SXin Li                m_MediumPriorityQueue.pop();
*3e777be0SXin Li                mediumPriorityCount += 1;
*3e777be0SXin Li                // Reset high priority count
*3e777be0SXin Li                highPriorityCount = 0;
*3e777be0SXin Li            }
*3e777be0SXin Li            // If medium priority queue is empty or the count exceeds the retire rate, get low priority message
*3e777be0SXin Li            else if (!m_LowPriorityQueue.empty())
*3e777be0SXin Li            {
*3e777be0SXin Li                pMsg = m_LowPriorityQueue.front();
*3e777be0SXin Li                m_LowPriorityQueue.pop();
*3e777be0SXin Li                // Reset high and medium priority count
*3e777be0SXin Li                highPriorityCount = 0;
*3e777be0SXin Li                mediumPriorityCount = 0;
*3e777be0SXin Li            }
*3e777be0SXin Li            else
*3e777be0SXin Li            {
*3e777be0SXin Li                // Reset high and medium priority count
*3e777be0SXin Li                highPriorityCount = 0;
*3e777be0SXin Li                mediumPriorityCount = 0;
*3e777be0SXin Li                continue;
*3e777be0SXin Li            }
*3e777be0SXin Li        }
*3e777be0SXin Li
*3e777be0SXin Li        switch (pMsg->type)
*3e777be0SXin Li        {
*3e777be0SXin Li            case ThreadMsgType::REQUEST:
*3e777be0SXin Li            {
*3e777be0SXin Li                ALOGV("RequestThread_1_3::Process() - request");
*3e777be0SXin Li                // invoke the asynchronous execution method
*3e777be0SXin Li                PreparedModel<HalVersion>* model = pMsg->data->m_Model;
*3e777be0SXin Li                model->ExecuteGraph(pMsg->data->m_MemPools,
*3e777be0SXin Li                                    *(pMsg->data->m_InputTensors),
*3e777be0SXin Li                                    *(pMsg->data->m_OutputTensors),
*3e777be0SXin Li                                    pMsg->data->m_CallbackContext);
*3e777be0SXin Li                break;
*3e777be0SXin Li            }
*3e777be0SXin Li
*3e777be0SXin Li            case ThreadMsgType::EXIT:
*3e777be0SXin Li            {
*3e777be0SXin Li                ALOGV("RequestThread_1_3::Process() - exit");
*3e777be0SXin Li                // delete all remaining messages (there should not be any)
*3e777be0SXin Li                std::unique_lock<std::mutex> lock(m_Mutex);
*3e777be0SXin Li                while (!m_HighPriorityQueue.empty())
*3e777be0SXin Li                {
*3e777be0SXin Li                    m_HighPriorityQueue.pop();
*3e777be0SXin Li                }
*3e777be0SXin Li                while (!m_MediumPriorityQueue.empty())
*3e777be0SXin Li                {
*3e777be0SXin Li                    m_MediumPriorityQueue.pop();
*3e777be0SXin Li                }
*3e777be0SXin Li                while (!m_LowPriorityQueue.empty())
*3e777be0SXin Li                {
*3e777be0SXin Li                    m_LowPriorityQueue.pop();
*3e777be0SXin Li                }
*3e777be0SXin Li                return;
*3e777be0SXin Li            }
*3e777be0SXin Li
*3e777be0SXin Li            default:
*3e777be0SXin Li                // this should be unreachable
*3e777be0SXin Li                throw armnn::RuntimeException("ArmNN: RequestThread_1_3: invalid message type");
*3e777be0SXin Li        }
*3e777be0SXin Li    }
*3e777be0SXin Li}
*3e777be0SXin Li
*3e777be0SXin Li///
*3e777be0SXin Li/// Class template specializations
*3e777be0SXin Li///
*3e777be0SXin Li
*3e777be0SXin Litemplate class RequestThread_1_3<ArmnnPreparedModel_1_3, hal_1_3::HalPolicy, CallbackContext_1_3>;
*3e777be0SXin Li
*3e777be0SXin Li} // namespace armnn_driver