blob: 71ee95b2aaa66f01c96012203048b8935e0ac2ba [file] [log] [blame]
//
// Copyright © 2022 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//
#include "RefConvertFp32ToBf16Workload.hpp"
#include "RefWorkloadUtils.hpp"
#include <armnnUtils/FloatingPointConverter.hpp>
#include <BFloat16.hpp>
namespace armnn
{
void RefConvertFp32ToBf16Workload::Execute() const
{
Execute(m_Data.m_Inputs, m_Data.m_Outputs);
}
// Asynchronous entry point: interprets executionData.m_Data as a
// WorkingMemDescriptor and runs the conversion on the input/output
// tensor handles that descriptor carries.
void RefConvertFp32ToBf16Workload::ExecuteAsync(ExecutionData& executionData)
{
    auto* const descriptor = static_cast<WorkingMemDescriptor*>(executionData.m_Data);
    Execute(descriptor->m_Inputs, descriptor->m_Outputs);
}
// Shared implementation used by both Execute() and ExecuteAsync().
//
// Maps the first input handle as a float buffer and the first output handle
// as a BFloat16 buffer, then converts every element of the input tensor
// into the output buffer. Only inputs[0] and outputs[0] are accessed.
void RefConvertFp32ToBf16Workload::Execute(std::vector<ITensorHandle*> inputs,
                                           std::vector<ITensorHandle*> outputs) const
{
    ARMNN_SCOPED_PROFILING_EVENT(Compute::CpuRef, "RefConvertFp32ToBf16Workload_Execute");

    ITensorHandle* const srcHandle = inputs[0];
    ITensorHandle* const dstHandle = outputs[0];

    // Map the source first, then the destination.
    const float* const srcData = reinterpret_cast<const float*>(srcHandle->Map());
    BFloat16* const dstData = reinterpret_cast<BFloat16*>(dstHandle->Map());

    // The number of elements to convert is taken from the input tensor's info.
    const unsigned int elementCount = GetTensorInfo(srcHandle).GetNumElements();

    armnnUtils::FloatingPointConverter::ConvertFloat32ToBFloat16(srcData, elementCount, dstData);
}
} //namespace armnn