├── .gitignore ├── .gitignore.license ├── 1.0 ├── ArmnnDriver.hpp ├── ArmnnDriverImpl.cpp ├── ArmnnDriverImpl.hpp ├── FullyConnected.hpp ├── HalPolicy.cpp └── HalPolicy.hpp ├── 1.1 ├── ArmnnDriver.hpp ├── ArmnnDriverImpl.cpp ├── ArmnnDriverImpl.hpp ├── HalPolicy.cpp └── HalPolicy.hpp ├── 1.2 ├── ArmnnDriver.hpp ├── ArmnnDriverImpl.cpp ├── ArmnnDriverImpl.hpp ├── HalPolicy.cpp └── HalPolicy.hpp ├── 1.3 ├── ArmnnDriver.hpp ├── ArmnnDriverImpl.cpp ├── ArmnnDriverImpl.hpp ├── HalPolicy.cpp └── HalPolicy.hpp ├── Android.bp ├── Android.mk ├── ArmnnDevice.cpp ├── ArmnnDevice.hpp ├── ArmnnDriver.hpp ├── ArmnnDriverImpl.cpp ├── ArmnnDriverImpl.hpp ├── ArmnnPreparedModel.cpp ├── ArmnnPreparedModel.hpp ├── ArmnnPreparedModel_1_2.cpp ├── ArmnnPreparedModel_1_2.hpp ├── ArmnnPreparedModel_1_3.cpp ├── ArmnnPreparedModel_1_3.hpp ├── CacheDataHandler.cpp ├── CacheDataHandler.hpp ├── ConversionUtils.cpp ├── ConversionUtils.hpp ├── ConversionUtils_1_2.hpp ├── ConversionUtils_1_3.hpp ├── DriverOptions.cpp ├── DriverOptions.hpp ├── LICENSE ├── LICENSE.spdx ├── LICENSES └── MIT.txt ├── ModelToINetworkConverter.cpp ├── ModelToINetworkConverter.hpp ├── NnapiSupport.txt ├── NnapiSupport.txt.license ├── README.md ├── README.md.license ├── RequestThread.cpp ├── RequestThread.hpp ├── RequestThread_1_3.cpp ├── RequestThread_1_3.hpp ├── SECURITY.md ├── SECURITY.md.license ├── SystemPropertiesUtils.hpp ├── Utils.cpp ├── Utils.hpp ├── android.hardware.neuralnetworks@1.0-service-armnn.rc ├── android.hardware.neuralnetworks@1.0-service-armnn.rc.license ├── android.hardware.neuralnetworks@1.1-service-armnn.rc ├── android.hardware.neuralnetworks@1.1-service-armnn.rc.license ├── android.hardware.neuralnetworks@1.2-service-armnn.rc ├── android.hardware.neuralnetworks@1.2-service-armnn.rc.license ├── android.hardware.neuralnetworks@1.3-service-armnn.rc ├── android.hardware.neuralnetworks@1.3-service-armnn.rc.license ├── docs ├── FAQ.md ├── FAQ.md.license ├── IntegratorGuide.md └── 
IntegratorGuide.md.license ├── service.cpp ├── setup.sh └── test ├── 1.0 ├── Convolution2D.cpp ├── FullyConnectedReshape.cpp └── Lstm.cpp ├── 1.1 ├── Convolution2D.cpp ├── Lstm.cpp ├── Mean.cpp └── Transpose.cpp ├── 1.2 ├── Capabilities.cpp ├── Dilation.cpp ├── Lstm.cpp ├── Mean.cpp └── UnidirectionalSequenceLstm.cpp ├── 1.3 ├── QLstm.cpp └── QosTests.cpp ├── Android.mk ├── Concat.cpp ├── Concurrent.cpp ├── Convolution2D.hpp ├── Dilation.hpp ├── DriverTestHelpers.cpp ├── DriverTestHelpers.hpp ├── FullyConnected.cpp ├── GenericLayerTests.cpp ├── Lstm.hpp ├── SystemProperties.cpp ├── TestHalfTensor.cpp ├── TestHalfTensor.hpp ├── TestTensor.cpp ├── TestTensor.hpp ├── Tests.cpp ├── UnidirectionalSequenceLstm.hpp └── UtilsTests.cpp /.gitignore: -------------------------------------------------------------------------------- 1 | armnn 2 | boost_1_64_0 3 | clframework 4 | flatbuffers-1.12.0 5 | prebuilt 6 | .vscode/settings.json 7 | .gitignore 8 | -------------------------------------------------------------------------------- /.gitignore.license: -------------------------------------------------------------------------------- 1 | # 2 | # Copyright © 2018, 2022 Arm Ltd and Contributors. All rights reserved. 3 | # SPDX-License-Identifier: MIT 4 | # 5 | -------------------------------------------------------------------------------- /1.0/ArmnnDriver.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include 9 | 10 | #include "../ArmnnDevice.hpp" 11 | #include "ArmnnDriverImpl.hpp" 12 | #include "HalPolicy.hpp" 13 | 14 | #include "../ArmnnDriverImpl.hpp" 15 | 16 | #include 17 | 18 | namespace armnn_driver 19 | { 20 | namespace hal_1_0 21 | { 22 | 23 | class ArmnnDriver : public ArmnnDevice, public V1_0::IDevice 24 | { 25 | public: 26 | ArmnnDriver(DriverOptions options) 27 | : ArmnnDevice(std::move(options)) 28 | { 29 | ALOGV("hal_1_0::ArmnnDriver::ArmnnDriver()"); 30 | } 31 | ~ArmnnDriver() {} 32 | 33 | public: 34 | Return getCapabilities(V1_0::IDevice::getCapabilities_cb cb) override 35 | { 36 | ALOGV("hal_1_0::ArmnnDriver::getCapabilities()"); 37 | 38 | return hal_1_0::ArmnnDriverImpl::getCapabilities(m_Runtime, cb); 39 | } 40 | 41 | Return getSupportedOperations(const V1_0::Model& model, 42 | V1_0::IDevice::getSupportedOperations_cb cb) override 43 | { 44 | ALOGV("hal_1_0::ArmnnDriver::getSupportedOperations()"); 45 | 46 | return armnn_driver::ArmnnDriverImpl::getSupportedOperations(m_Runtime, m_Options, model, cb); 47 | } 48 | 49 | Return prepareModel(const V1_0::Model& model, 50 | const android::sp& cb) override 51 | { 52 | ALOGV("hal_1_0::ArmnnDriver::prepareModel()"); 53 | 54 | return armnn_driver::ArmnnDriverImpl::prepareModel(m_Runtime, 55 | m_ClTunedParameters, 56 | m_Options, 57 | model, 58 | cb); 59 | } 60 | 61 | Return getStatus() override 62 | { 63 | ALOGV("hal_1_0::ArmnnDriver::getStatus()"); 64 | 65 | return armnn_driver::ArmnnDriverImpl::getStatus(); 66 | } 67 | }; 68 | 69 | } // namespace hal_1_0 70 | } // namespace armnn_driver 71 | -------------------------------------------------------------------------------- /1.0/ArmnnDriverImpl.cpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #include "ArmnnDriverImpl.hpp" 7 | #include "../SystemPropertiesUtils.hpp" 8 | 9 | #include 10 | 11 | namespace 12 | { 13 | 14 | const char *g_Float32PerformanceExecTimeName = "ArmNN.float32Performance.execTime"; 15 | const char *g_Float32PerformancePowerUsageName = "ArmNN.float32Performance.powerUsage"; 16 | const char *g_Quantized8PerformanceExecTimeName = "ArmNN.quantized8Performance.execTime"; 17 | const char *g_Quantized8PerformancePowerUsageName = "ArmNN.quantized8Performance.powerUsage"; 18 | 19 | } // anonymous namespace 20 | 21 | namespace armnn_driver 22 | { 23 | namespace hal_1_0 24 | { 25 | 26 | Return ArmnnDriverImpl::getCapabilities(const armnn::IRuntimePtr& runtime, 27 | V1_0::IDevice::getCapabilities_cb cb) 28 | { 29 | ALOGV("hal_1_0::ArmnnDriverImpl::getCapabilities()"); 30 | 31 | V1_0::Capabilities capabilities; 32 | if (runtime) 33 | { 34 | capabilities.float32Performance.execTime = 35 | ParseSystemProperty(g_Float32PerformanceExecTimeName, .1f); 36 | 37 | capabilities.float32Performance.powerUsage = 38 | ParseSystemProperty(g_Float32PerformancePowerUsageName, .1f); 39 | 40 | capabilities.quantized8Performance.execTime = 41 | ParseSystemProperty(g_Quantized8PerformanceExecTimeName, .1f); 42 | 43 | capabilities.quantized8Performance.powerUsage = 44 | ParseSystemProperty(g_Quantized8PerformancePowerUsageName, .1f); 45 | 46 | cb(V1_0::ErrorStatus::NONE, capabilities); 47 | } 48 | else 49 | { 50 | capabilities.float32Performance.execTime = 0; 51 | capabilities.float32Performance.powerUsage = 0; 52 | capabilities.quantized8Performance.execTime = 0; 53 | capabilities.quantized8Performance.powerUsage = 0; 54 | 55 | cb(V1_0::ErrorStatus::DEVICE_UNAVAILABLE, capabilities); 56 | } 57 | 58 | return Void(); 59 | } 60 | 61 | } // namespace hal_1_0 62 | } // namespace armnn_driver -------------------------------------------------------------------------------- /1.0/ArmnnDriverImpl.hpp: 
-------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include 9 | 10 | #include "../DriverOptions.hpp" 11 | 12 | #include 13 | 14 | #ifdef ARMNN_ANDROID_R 15 | using namespace android::nn::hal; 16 | #endif 17 | 18 | #ifdef ARMNN_ANDROID_S 19 | using namespace android::hardware; 20 | #endif 21 | 22 | namespace V1_0 = ::android::hardware::neuralnetworks::V1_0; 23 | 24 | namespace armnn_driver 25 | { 26 | namespace hal_1_0 27 | { 28 | 29 | class ArmnnDriverImpl 30 | { 31 | public: 32 | static Return getCapabilities(const armnn::IRuntimePtr& runtime, V1_0::IDevice::getCapabilities_cb cb); 33 | }; 34 | 35 | } // namespace hal_1_0 36 | } // namespace armnn_driver 37 | -------------------------------------------------------------------------------- /1.0/FullyConnected.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include 9 | 10 | #include "../ConversionUtils.hpp" 11 | 12 | namespace armnn_driver 13 | { 14 | 15 | inline armnn::TensorShape FlattenFullyConnectedInput(const armnn::TensorShape& inputShape, 16 | const armnn::TensorShape& weightsShape) 17 | { 18 | if (inputShape.GetNumDimensions() > 2U) 19 | { 20 | unsigned int totalInputElements = inputShape.GetNumElements(); 21 | unsigned int inputSize = weightsShape[1]; 22 | 23 | unsigned int batchSize = totalInputElements / inputSize; 24 | 25 | if(totalInputElements % batchSize != 0) 26 | { 27 | throw std::runtime_error("Failed to deduce tensor shape"); 28 | } 29 | 30 | return armnn::TensorShape({batchSize, inputSize}); 31 | } 32 | else 33 | { 34 | return inputShape; 35 | } 36 | } 37 | 38 | inline bool VerifyFullyConnectedShapes(const armnn::TensorShape& inputShape, 39 | const armnn::TensorShape& weightsShape, 40 | const armnn::TensorShape& outputShape, 41 | bool transposeWeightMatrix) 42 | { 43 | unsigned int dimIdx = transposeWeightMatrix ? 0 : 1; 44 | return (inputShape[0] == outputShape[0] && weightsShape[dimIdx] == outputShape[1]); 45 | } 46 | 47 | } -------------------------------------------------------------------------------- /1.0/HalPolicy.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017-2021,2023 Arm Ltd and Contributors. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include "../ConversionUtils.hpp" 9 | 10 | #include 11 | 12 | namespace V1_0 = ::android::hardware::neuralnetworks::V1_0; 13 | 14 | namespace armnn_driver 15 | { 16 | namespace hal_1_0 17 | { 18 | 19 | class HalPolicy 20 | { 21 | public: 22 | using Model = V1_0::Model; 23 | using Operand = V1_0::Operand; 24 | using OperandLifeTime = V1_0::OperandLifeTime; 25 | using OperandType = V1_0::OperandType; 26 | using Operation = V1_0::Operation; 27 | using OperationType = V1_0::OperationType; 28 | using getSupportedOperations_cb = V1_0::IDevice::getSupportedOperations_cb; 29 | using ErrorStatus = V1_0::ErrorStatus; 30 | 31 | static bool ConvertOperation(const Operation& operation, const Model& model, ConversionData& data); 32 | 33 | private: 34 | static bool ConvertAveragePool2d(const Operation& operation, const Model& model, ConversionData& data); 35 | 36 | static bool ConvertConcatenation(const Operation& operation, const Model& model, ConversionData& data); 37 | 38 | static bool ConvertConv2d(const Operation& operation, const Model& model, ConversionData& data); 39 | 40 | static bool ConvertDepthToSpace(const Operation& operation, const Model& model, ConversionData& data); 41 | 42 | static bool ConvertDepthwiseConv2d(const Operation& operation, const Model& model, ConversionData& data); 43 | 44 | static bool ConvertDequantize(const Operation& operation, const Model& model, ConversionData& data); 45 | 46 | static bool ConvertElementwiseBinary(const Operation& operation, 47 | const Model& model, 48 | ConversionData& data, 49 | armnn::BinaryOperation binaryOperation); 50 | 51 | static bool ConvertFloor(const Operation& operation, const Model& model, ConversionData& data); 52 | 53 | static bool ConvertFullyConnected(const Operation& operation, const Model& model, ConversionData& data); 54 | 55 | static bool ConvertLocalResponseNormalization(const Operation& operation, 56 | const Model& model, 57 | 
ConversionData& data); 58 | 59 | static bool ConvertLogistic(const Operation& operation, const Model& model, ConversionData& data); 60 | 61 | static bool ConvertLstm(const Operation& operation, const Model& model, ConversionData& data); 62 | 63 | static bool ConvertL2Normalization(const Operation& operation, const Model& model, ConversionData& data); 64 | 65 | static bool ConvertL2Pool2d(const Operation& operation, const Model& model, ConversionData& data); 66 | 67 | static bool ConvertMaxPool2d(const Operation& operation, const Model& model, ConversionData& data); 68 | 69 | static bool ConvertReLu(const Operation& operation, const Model& model, ConversionData& data); 70 | 71 | static bool ConvertReLu1(const Operation& operation, const Model& model, ConversionData& data); 72 | 73 | static bool ConvertReLu6(const Operation& operation, const Model& model, ConversionData& data); 74 | 75 | static bool ConvertSoftmax(const Operation& operation, const Model& model, ConversionData& data); 76 | 77 | static bool ConvertReshape(const Operation& operation, const Model& model, ConversionData& data); 78 | 79 | static bool ConvertResizeBilinear(const Operation& operation, const Model& model, ConversionData& data); 80 | 81 | static bool ConvertSpaceToDepth(const Operation& operation, const Model& model, ConversionData& data); 82 | 83 | static bool ConvertTanH(const Operation& operation, const Model& model, ConversionData& data); 84 | 85 | static bool ValidateConv2dParameters(const Operation& operation); 86 | 87 | static bool ValidateDepthwiseConv2dParameters(const Operation& operation); 88 | }; 89 | 90 | } // namespace hal_1_0 91 | } // namespace armnn_driver 92 | -------------------------------------------------------------------------------- /1.1/ArmnnDriver.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include 9 | 10 | #include "../ArmnnDevice.hpp" 11 | #include "ArmnnDriverImpl.hpp" 12 | #include "HalPolicy.hpp" 13 | 14 | #include "../ArmnnDriverImpl.hpp" 15 | #include "../1.0/ArmnnDriverImpl.hpp" 16 | #include "../1.0/HalPolicy.hpp" 17 | 18 | #include 19 | 20 | namespace armnn_driver 21 | { 22 | namespace hal_1_1 23 | { 24 | 25 | class ArmnnDriver : public ArmnnDevice, public V1_1::IDevice 26 | { 27 | public: 28 | ArmnnDriver(DriverOptions options) 29 | : ArmnnDevice(std::move(options)) 30 | { 31 | ALOGV("hal_1_1::ArmnnDriver::ArmnnDriver()"); 32 | } 33 | ~ArmnnDriver() {} 34 | 35 | public: 36 | 37 | Return getCapabilities(V1_0::IDevice::getCapabilities_cb cb) override 38 | { 39 | ALOGV("hal_1_1::ArmnnDriver::getCapabilities()"); 40 | 41 | return hal_1_0::ArmnnDriverImpl::getCapabilities(m_Runtime, cb); 42 | } 43 | 44 | Return getSupportedOperations(const V1_0::Model& model, 45 | V1_0::IDevice::getSupportedOperations_cb cb) override 46 | { 47 | ALOGV("hal_1_1::ArmnnDriver::getSupportedOperations()"); 48 | 49 | return armnn_driver::ArmnnDriverImpl::getSupportedOperations(m_Runtime, 50 | m_Options, 51 | model, 52 | cb); 53 | } 54 | 55 | Return prepareModel(const V1_0::Model& model, 56 | const android::sp& cb) override 57 | { 58 | ALOGV("hal_1_1::ArmnnDriver::prepareModel()"); 59 | 60 | return armnn_driver::ArmnnDriverImpl::prepareModel(m_Runtime, 61 | m_ClTunedParameters, 62 | m_Options, 63 | model, 64 | cb); 65 | } 66 | 67 | Return getCapabilities_1_1(V1_1::IDevice::getCapabilities_1_1_cb cb) override 68 | { 69 | ALOGV("hal_1_1::ArmnnDriver::getCapabilities_1_1()"); 70 | 71 | return hal_1_1::ArmnnDriverImpl::getCapabilities_1_1(m_Runtime, cb); 72 | } 73 | 74 | Return getSupportedOperations_1_1(const V1_1::Model& model, 75 | V1_1::IDevice::getSupportedOperations_1_1_cb cb) override 76 | { 77 | ALOGV("hal_1_1::ArmnnDriver::getSupportedOperations_1_1()"); 78 | 79 | return 
armnn_driver::ArmnnDriverImpl::getSupportedOperations(m_Runtime, 80 | m_Options, 81 | model, 82 | cb); 83 | } 84 | 85 | Return prepareModel_1_1(const V1_1::Model& model, 86 | V1_1::ExecutionPreference preference, 87 | const android::sp& cb) override 88 | { 89 | ALOGV("hal_1_1::ArmnnDriver::prepareModel_1_1()"); 90 | 91 | if (!(preference == V1_1::ExecutionPreference::LOW_POWER || 92 | preference == V1_1::ExecutionPreference::FAST_SINGLE_ANSWER || 93 | preference == V1_1::ExecutionPreference::SUSTAINED_SPEED)) 94 | { 95 | ALOGV("hal_1_1::ArmnnDriver::prepareModel_1_1: Invalid execution preference"); 96 | cb->notify(V1_0::ErrorStatus::INVALID_ARGUMENT, nullptr); 97 | return V1_0::ErrorStatus::INVALID_ARGUMENT; 98 | } 99 | 100 | return armnn_driver::ArmnnDriverImpl::prepareModel(m_Runtime, 101 | m_ClTunedParameters, 102 | m_Options, 103 | model, 104 | cb, 105 | model.relaxComputationFloat32toFloat16 106 | && m_Options.GetFp16Enabled()); 107 | } 108 | 109 | Return getStatus() override 110 | { 111 | ALOGV("hal_1_1::ArmnnDriver::getStatus()"); 112 | 113 | return armnn_driver::ArmnnDriverImpl::getStatus(); 114 | } 115 | }; 116 | 117 | } // namespace hal_1_1 118 | } // namespace armnn_driver 119 | -------------------------------------------------------------------------------- /1.1/ArmnnDriverImpl.cpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #include "ArmnnDriverImpl.hpp" 7 | #include "../SystemPropertiesUtils.hpp" 8 | 9 | #include 10 | 11 | namespace 12 | { 13 | 14 | const char *g_Float32PerformanceExecTimeName = "ArmNN.float32Performance.execTime"; 15 | const char *g_Float32PerformancePowerUsageName = "ArmNN.float32Performance.powerUsage"; 16 | const char *g_Quantized8PerformanceExecTimeName = "ArmNN.quantized8Performance.execTime"; 17 | const char *g_Quantized8PerformancePowerUsageName = "ArmNN.quantized8Performance.powerUsage"; 18 | const char *g_RelaxedFloat32toFloat16PerformanceExecTime = "ArmNN.relaxedFloat32toFloat16Performance.execTime"; 19 | const char *g_RelaxedFloat32toFloat16PerformancePowerUsageName = "ArmNN.relaxedFloat32toFloat16Performance.powerUsage"; 20 | 21 | } // anonymous namespace 22 | 23 | namespace armnn_driver 24 | { 25 | namespace hal_1_1 26 | { 27 | 28 | Return ArmnnDriverImpl::getCapabilities_1_1(const armnn::IRuntimePtr& runtime, 29 | V1_1::IDevice::getCapabilities_1_1_cb cb) 30 | { 31 | ALOGV("hal_1_1::ArmnnDriverImpl::getCapabilities()"); 32 | 33 | V1_1::Capabilities capabilities; 34 | if (runtime) 35 | { 36 | capabilities.float32Performance.execTime = 37 | ParseSystemProperty(g_Float32PerformanceExecTimeName, .1f); 38 | 39 | capabilities.float32Performance.powerUsage = 40 | ParseSystemProperty(g_Float32PerformancePowerUsageName, .1f); 41 | 42 | capabilities.quantized8Performance.execTime = 43 | ParseSystemProperty(g_Quantized8PerformanceExecTimeName, .1f); 44 | 45 | capabilities.quantized8Performance.powerUsage = 46 | ParseSystemProperty(g_Quantized8PerformancePowerUsageName, .1f); 47 | 48 | capabilities.relaxedFloat32toFloat16Performance.execTime = 49 | ParseSystemProperty(g_RelaxedFloat32toFloat16PerformanceExecTime, .1f); 50 | 51 | capabilities.relaxedFloat32toFloat16Performance.powerUsage = 52 | ParseSystemProperty(g_RelaxedFloat32toFloat16PerformancePowerUsageName, .1f); 53 | 54 | cb(V1_0::ErrorStatus::NONE, 
capabilities); 55 | } 56 | else 57 | { 58 | capabilities.float32Performance.execTime = 0; 59 | capabilities.float32Performance.powerUsage = 0; 60 | capabilities.quantized8Performance.execTime = 0; 61 | capabilities.quantized8Performance.powerUsage = 0; 62 | capabilities.relaxedFloat32toFloat16Performance.execTime = 0; 63 | capabilities.relaxedFloat32toFloat16Performance.powerUsage = 0; 64 | 65 | cb(V1_0::ErrorStatus::DEVICE_UNAVAILABLE, capabilities); 66 | } 67 | 68 | return Void(); 69 | } 70 | 71 | } // namespace hal_1_1 72 | } // namespace armnn_driver -------------------------------------------------------------------------------- /1.1/ArmnnDriverImpl.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include 9 | 10 | #include "../DriverOptions.hpp" 11 | 12 | #include 13 | 14 | #ifdef ARMNN_ANDROID_R 15 | using namespace android::nn::hal; 16 | #endif 17 | 18 | #ifdef ARMNN_ANDROID_S 19 | using namespace android::hardware; 20 | #endif 21 | 22 | 23 | namespace V1_0 = ::android::hardware::neuralnetworks::V1_0; 24 | namespace V1_1 = ::android::hardware::neuralnetworks::V1_1; 25 | 26 | namespace armnn_driver 27 | { 28 | namespace hal_1_1 29 | { 30 | 31 | class ArmnnDriverImpl 32 | { 33 | public: 34 | static Return getCapabilities_1_1(const armnn::IRuntimePtr& runtime, 35 | V1_1::IDevice::getCapabilities_1_1_cb cb); 36 | }; 37 | 38 | } // namespace hal_1_1 39 | } // namespace armnn_driver 40 | -------------------------------------------------------------------------------- /1.1/HalPolicy.cpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017-2019,2023 Arm Ltd and Contributors. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #include "HalPolicy.hpp" 7 | 8 | #include "Utils.hpp" 9 | 10 | #include "../1.0/HalPolicy.hpp" 11 | 12 | namespace 13 | { 14 | static std::vector opsEquivalentInV10({ 15 | V1_0::OperationType::ADD, 16 | V1_0::OperationType::AVERAGE_POOL_2D, 17 | V1_0::OperationType::CONCATENATION, 18 | V1_0::OperationType::CONV_2D, 19 | V1_0::OperationType::DEPTH_TO_SPACE, 20 | V1_0::OperationType::DEPTHWISE_CONV_2D, 21 | V1_0::OperationType::DEQUANTIZE, 22 | V1_0::OperationType::FLOOR, 23 | V1_0::OperationType::FULLY_CONNECTED, 24 | V1_0::OperationType::LOCAL_RESPONSE_NORMALIZATION, 25 | V1_0::OperationType::LOGISTIC, 26 | V1_0::OperationType::LSTM, 27 | V1_0::OperationType::L2_NORMALIZATION, 28 | V1_0::OperationType::L2_POOL_2D, 29 | V1_0::OperationType::MAX_POOL_2D, 30 | V1_0::OperationType::MUL, 31 | V1_0::OperationType::RELU, 32 | V1_0::OperationType::RELU1, 33 | V1_0::OperationType::RELU6, 34 | V1_0::OperationType::SOFTMAX, 35 | V1_0::OperationType::SPACE_TO_DEPTH, 36 | V1_0::OperationType::TANH, 37 | V1_0::OperationType::RESHAPE, 38 | V1_0::OperationType::RESIZE_BILINEAR, 39 | }); 40 | 41 | bool CompliantWithVersion10(const V1_1::Operation & operation) 42 | { 43 | std::vector::iterator it; 44 | it = std::find(opsEquivalentInV10.begin(), opsEquivalentInV10.end(), 45 | static_cast(operation.type)); 46 | 47 | if(it != opsEquivalentInV10.end()) 48 | { 49 | return true; 50 | } 51 | return false; 52 | } 53 | 54 | V1_0::Operation ConvertOperationToVersion10(const V1_1::Operation & operation) 55 | { 56 | V1_0::Operation v10Operation; 57 | v10Operation.type = static_cast(operation.type); 58 | v10Operation.inputs = operation.inputs; 59 | v10Operation.outputs = operation.outputs; 60 | return v10Operation; 61 | } 62 | } 63 | 64 | namespace armnn_driver 65 | { 66 | namespace hal_1_1 67 | { 68 | 69 | bool HalPolicy::ConvertOperation(const Operation& operation, const Model& model, ConversionData& data) 70 | { 71 | if 
(CompliantWithVersion10(operation)) 72 | { 73 | hal_1_0::HalPolicy::Operation v10Operation = ConvertOperationToVersion10(operation); 74 | hal_1_0::HalPolicy::Model v10Model = convertToV1_0(model); 75 | 76 | return hal_1_0::HalPolicy::ConvertOperation(v10Operation, v10Model, data); 77 | } 78 | else 79 | { 80 | switch (operation.type) 81 | { 82 | case V1_1::OperationType::DIV: 83 | return ConvertElementwiseBinary(operation, model, data, armnn::BinaryOperation::Div); 84 | case V1_1::OperationType::SUB: 85 | return ConvertElementwiseBinary(operation, model, data, armnn::BinaryOperation::Sub); 86 | case V1_1::OperationType::MEAN: 87 | return ConvertMean(operation, model, data); 88 | case V1_1::OperationType::PAD: 89 | return ConvertPad(operation, model, data); 90 | case V1_1::OperationType::SPACE_TO_BATCH_ND: 91 | return ConvertSpaceToBatchNd(operation, model, data); 92 | case V1_1::OperationType::SQUEEZE: 93 | return ConvertSqueeze(operation, model, data); 94 | case V1_1::OperationType::STRIDED_SLICE: 95 | return ConvertStridedSlice(operation, model, data); 96 | case V1_1::OperationType::TRANSPOSE: 97 | return ConvertTranspose(operation, model, data); 98 | case V1_1::OperationType::BATCH_TO_SPACE_ND: 99 | return ConvertBatchToSpaceNd(operation, model, data); 100 | default: 101 | return Fail("%s: Operation type %s not supported in ArmnnDriver", 102 | __func__, toString(operation.type).c_str()); 103 | } 104 | } 105 | } 106 | 107 | bool HalPolicy::ConvertElementwiseBinary(const Operation& operation, 108 | const Model& model, 109 | ConversionData& data, 110 | armnn::BinaryOperation binaryOperation) 111 | { 112 | ALOGV("hal_1_1::HalPolicy::ConvertElementwiseBinary()"); 113 | return ::ConvertElementwiseBinary(operation, model, data, binaryOperation); 114 | } 115 | 116 | bool HalPolicy::ConvertMean(const Operation& operation, const Model& model, ConversionData& data) 117 | { 118 | ALOGV("hal_1_1::HalPolicy::ConvertMean()"); 119 | return ::ConvertMean(operation, model, data); 
120 | } 121 | 122 | bool HalPolicy::ConvertPad(const Operation& operation, const Model& model, ConversionData& data) 123 | { 124 | ALOGV("hal_1_1::HalPolicy::ConvertPad()"); 125 | return ::ConvertPad(operation, model, data); 126 | } 127 | 128 | bool HalPolicy::ConvertSpaceToBatchNd(const Operation& operation, const Model& model, ConversionData& data) 129 | { 130 | ALOGV("hal_1_1::HalPolicy::ConvertSpaceToBatchNd()"); 131 | return ::ConvertSpaceToBatchNd(operation, model, data); 132 | } 133 | 134 | bool HalPolicy::ConvertSqueeze(const Operation& operation, const Model& model, ConversionData& data) 135 | { 136 | ALOGV("hal_1_1::HalPolicy::ConvertSqueeze()"); 137 | return ::ConvertSqueeze(operation, model, data); 138 | } 139 | 140 | bool HalPolicy::ConvertStridedSlice(const Operation& operation, const Model& model, ConversionData& data) 141 | { 142 | ALOGV("hal_1_1::HalPolicy::ConvertStridedSlice()"); 143 | return ::ConvertStridedSlice(operation, model, data); 144 | } 145 | 146 | bool HalPolicy::ConvertTranspose(const Operation& operation, const Model& model, ConversionData& data) 147 | { 148 | ALOGV("hal_1_1::HalPolicy::ConvertTranspose()"); 149 | return ::ConvertTranspose(operation, model, data); 150 | } 151 | 152 | bool HalPolicy::ConvertBatchToSpaceNd(const Operation& operation, const Model& model, ConversionData& data) 153 | { 154 | ALOGV("hal_1_1::HalPolicy::ConvertBatchToSpaceNd()"); 155 | return ::ConvertBatchToSpaceNd(operation, model, data); 156 | } 157 | 158 | } // namespace hal_1_1 159 | } // namespace armnn_driver 160 | -------------------------------------------------------------------------------- /1.1/HalPolicy.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017-2021,2023 Arm Ltd and Contributors. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include "../ConversionUtils.hpp" 9 | 10 | #include 11 | 12 | namespace V1_1 = ::android::hardware::neuralnetworks::V1_1; 13 | 14 | namespace armnn_driver 15 | { 16 | namespace hal_1_1 17 | { 18 | 19 | class HalPolicy 20 | { 21 | public: 22 | using Model = V1_1::Model; 23 | using Operand = V1_0::Operand; 24 | using OperandLifeTime = V1_0::OperandLifeTime; 25 | using OperandType = V1_0::OperandType; 26 | using Operation = V1_1::Operation; 27 | using OperationType = V1_1::OperationType; 28 | using getSupportedOperations_cb = V1_1::IDevice::getSupportedOperations_1_1_cb; 29 | using ErrorStatus = V1_0::ErrorStatus; 30 | 31 | static bool ConvertOperation(const Operation& operation, const Model& model, ConversionData& data); 32 | 33 | private: 34 | static bool ConvertElementwiseBinary(const Operation& operation, 35 | const Model& model, 36 | ConversionData& data, 37 | armnn::BinaryOperation binaryOperation); 38 | 39 | static bool ConvertMean(const Operation& operation, const Model& model, ConversionData& data); 40 | static bool ConvertPad(const Operation& operation, const Model& model, ConversionData& data); 41 | static bool ConvertSpaceToBatchNd(const Operation& operation, const Model& model, ConversionData& data); 42 | static bool ConvertSqueeze(const Operation& operation, const Model& model, ConversionData& data); 43 | static bool ConvertStridedSlice(const Operation& operation, const Model& model, ConversionData& data); 44 | static bool ConvertTranspose(const Operation& operation, const Model& model, ConversionData& data); 45 | static bool ConvertBatchToSpaceNd(const Operation& operation, const Model& model, ConversionData& data); 46 | }; 47 | 48 | } // namespace hal_1_1 49 | } // namespace armnn_driver 50 | -------------------------------------------------------------------------------- /1.2/ArmnnDriverImpl.hpp: -------------------------------------------------------------------------------- 1 | 
// 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include 9 | 10 | #include "../CacheDataHandler.hpp" 11 | #include "../DriverOptions.hpp" 12 | 13 | #include 14 | 15 | #include 16 | 17 | #ifdef ARMNN_ANDROID_R 18 | using namespace android::nn::hal; 19 | #endif 20 | 21 | #ifdef ARMNN_ANDROID_S 22 | using namespace android::hardware; 23 | #endif 24 | 25 | namespace V1_0 = ::android::hardware::neuralnetworks::V1_0; 26 | namespace V1_2 = ::android::hardware::neuralnetworks::V1_2; 27 | 28 | namespace armnn_driver 29 | { 30 | namespace hal_1_2 31 | { 32 | 33 | class ArmnnDriverImpl 34 | { 35 | public: 36 | using HidlToken = android::hardware::hidl_array; 37 | 38 | static Return prepareArmnnModel_1_2( 39 | const armnn::IRuntimePtr& runtime, 40 | const armnn::IGpuAccTunedParametersPtr& clTunedParameters, 41 | const DriverOptions& options, 42 | const V1_2::Model& model, 43 | const android::hardware::hidl_vec& modelCacheHandle, 44 | const android::hardware::hidl_vec& dataCacheHandle, 45 | const HidlToken& token, 46 | const android::sp& cb, 47 | bool float32ToFloat16 = false); 48 | 49 | static Return prepareModelFromCache( 50 | const armnn::IRuntimePtr& runtime, 51 | const DriverOptions& options, 52 | const android::hardware::hidl_vec& modelCacheHandle, 53 | const android::hardware::hidl_vec& dataCacheHandle, 54 | const HidlToken& token, 55 | const android::sp& cb, 56 | bool float32ToFloat16 = false); 57 | 58 | static Return getCapabilities_1_2(const armnn::IRuntimePtr& runtime, 59 | V1_2::IDevice::getCapabilities_1_2_cb cb); 60 | }; 61 | 62 | } // namespace hal_1_2 63 | } // namespace armnn_driver -------------------------------------------------------------------------------- /1.2/HalPolicy.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2019-2023 Arm Ltd and Contributors. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include "../ConversionUtils.hpp" 9 | #include "../ConversionUtils_1_2.hpp" 10 | 11 | #include 12 | 13 | #include 14 | 15 | namespace V1_2 = ::android::hardware::neuralnetworks::V1_2; 16 | 17 | namespace armnn_driver 18 | { 19 | class DriverOptions; 20 | namespace hal_1_2 21 | { 22 | 23 | class HalPolicy 24 | { 25 | public: 26 | using Model = V1_2::Model; 27 | using Operand = V1_2::Operand; 28 | using OperandLifeTime = V1_0::OperandLifeTime; 29 | using OperandType = V1_2::OperandType; 30 | using Operation = V1_2::Operation; 31 | using OperationType = V1_2::OperationType; 32 | using ExecutionCallback = V1_2::IExecutionCallback; 33 | using getSupportedOperations_cb = V1_2::IDevice::getSupportedOperations_1_2_cb; 34 | using ErrorStatus = V1_0::ErrorStatus; 35 | using DeviceType = V1_2::DeviceType; 36 | 37 | static DeviceType GetDeviceTypeFromOptions(const DriverOptions& options); 38 | 39 | static bool ConvertOperation(const Operation& operation, const Model& model, ConversionData& data); 40 | 41 | private: 42 | static bool ConvertArgMinMax(const Operation& operation, 43 | const Model& model, 44 | ConversionData& data, 45 | armnn::ArgMinMaxFunction argMinMaxFunction); 46 | 47 | static bool ConvertAveragePool2d(const Operation& operation, const Model& model, ConversionData& data); 48 | 49 | static bool ConvertBatchToSpaceNd(const Operation& operation, const Model& model, ConversionData& data); 50 | 51 | static bool ConvertCast(const Operation& operation, const Model& model, ConversionData& data); 52 | 53 | static bool ConvertChannelShuffle(const Operation& operation, const Model& model, ConversionData& data); 54 | 55 | static bool ConvertComparison(const Operation& operation, 56 | const Model& model, 57 | ConversionData& data, 58 | armnn::ComparisonOperation comparisonOperation); 59 | 60 | static bool ConvertConcatenation(const Operation& operation, const Model& model, ConversionData& data); 61 | 62 
| static bool ConvertConv2d(const Operation& operation, const Model& model, ConversionData& data); 63 | 64 | static bool ConvertDepthToSpace(const Operation& operation, const Model& model, ConversionData& data); 65 | 66 | static bool ConvertDepthwiseConv2d(const Operation& operation, const Model& model, ConversionData& data); 67 | 68 | static bool ConvertDequantize(const Operation& operation, const Model& model, ConversionData& data); 69 | 70 | static bool ConvertExpandDims(const Operation& operation, const Model& model, ConversionData& data); 71 | 72 | static bool ConvertElementwiseBinary(const Operation& operation, 73 | const Model& model, 74 | ConversionData& data, 75 | armnn::BinaryOperation binaryOperation); 76 | 77 | static bool ConvertElementwiseUnary(const Operation& operation, 78 | const Model& model, 79 | ConversionData& data, 80 | armnn::UnaryOperation unaryOperation); 81 | 82 | static bool ConvertFloor(const Operation& operation, const Model& model, ConversionData& data); 83 | 84 | static bool ConvertFullyConnected(const Operation& operation, const Model& model, ConversionData& data); 85 | 86 | static bool ConvertGather(const Operation& operation, const Model& model, ConversionData& data); 87 | 88 | static bool ConvertGroupedConv2d(const Operation& operation, const Model& model, ConversionData& data); 89 | 90 | static bool ConvertInstanceNormalization(const Operation& operation, const Model& model, ConversionData& data); 91 | 92 | static bool ConvertL2Normalization(const Operation& operation, const Model& model, ConversionData& data); 93 | 94 | static bool ConvertL2Pool2d(const Operation& operation, const Model& model, ConversionData& data); 95 | 96 | static bool ConvertLocalResponseNormalization(const Operation& operation, 97 | const Model& model, 98 | ConversionData& data); 99 | 100 | static bool ConvertLogistic(const Operation& operation, const Model& model, ConversionData& data); 101 | 102 | static bool ConvertLogSoftmax(const Operation& operation, 
const Model& model, ConversionData& data); 103 | 104 | static bool ConvertLstm(const Operation& operation, const Model& model, ConversionData& data); 105 | 106 | static bool ConvertMaxPool2d(const Operation& operation, const Model& model, ConversionData& data); 107 | 108 | static bool ConvertMean(const Operation& operation, const Model& model, ConversionData& data); 109 | 110 | static bool ConvertPad(const Operation& operation, const Model& model, ConversionData& data); 111 | 112 | static bool ConvertPadV2(const Operation& operation, const Model& model, ConversionData& data); 113 | 114 | static bool ConvertPrelu(const Operation& operation, const Model& model, ConversionData& data); 115 | 116 | static bool ConvertQuantize(const Operation& operation, const Model& model, ConversionData& data); 117 | 118 | static bool ConvertQuantized16BitLstm(const Operation& operation, const Model& model, ConversionData& data); 119 | 120 | static bool ConvertReduce(const Operation& operation, 121 | const Model& model, 122 | ConversionData& data, 123 | ReduceOperation reduce_operation); 124 | 125 | static bool ConvertReLu(const Operation& operation, const Model& model, ConversionData& data); 126 | 127 | static bool ConvertReLu1(const Operation& operation, const Model& model, ConversionData& data); 128 | 129 | static bool ConvertReLu6(const Operation& operation, const Model& model, ConversionData& data); 130 | 131 | static bool ConvertReshape(const Operation& operation, const Model& model, ConversionData& data); 132 | 133 | static bool ConvertResize(const Operation& operation, 134 | const Model& model, 135 | ConversionData& data, 136 | armnn::ResizeMethod resizeMethod); 137 | 138 | static bool ConvertSoftmax(const Operation& operation, const Model& model, ConversionData& data); 139 | 140 | static bool ConvertSpaceToBatchNd(const Operation& operation, const Model& model, ConversionData& data); 141 | 142 | static bool ConvertSpaceToDepth(const Operation& operation, const Model& model, 
ConversionData& data); 143 | 144 | static bool ConvertSplit(const Operation& operation, const Model& model, ConversionData& data); 145 | 146 | static bool ConvertSqrt(const Operation& operation, const Model& model, ConversionData& data); 147 | 148 | static bool ConvertSqueeze(const Operation& operation, const Model& model, ConversionData& data); 149 | 150 | static bool ConvertStridedSlice(const Operation& operation, const Model& model, ConversionData& data); 151 | 152 | static bool ConvertTanH(const Operation& operation, const Model& model, ConversionData& data); 153 | 154 | static bool ConvertTranspose(const Operation& operation, const Model& model, ConversionData& data); 155 | 156 | static bool ConvertTransposeConv2d(const Operation& operation, const Model& model, ConversionData& data); 157 | 158 | static bool ConvertTile(const Operation& operation, const Model& model, ConversionData& data); 159 | 160 | static bool ConvertUnidirectionalSequenceLstm(const Operation& operation, 161 | const Model& model, 162 | ConversionData& data); 163 | }; 164 | 165 | } // namespace hal_1_2 166 | } // namespace armnn_driver 167 | -------------------------------------------------------------------------------- /1.3/ArmnnDriverImpl.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2020 Arm Ltd. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include 9 | 10 | #include "../CacheDataHandler.hpp" 11 | #include "../DriverOptions.hpp" 12 | 13 | #include 14 | 15 | #if !defined(ARMNN_ANDROID_S) 16 | using namespace android::nn::hal; 17 | #endif 18 | 19 | #ifdef ARMNN_ANDROID_S 20 | using namespace android::hardware; 21 | #endif 22 | 23 | namespace V1_0 = ::android::hardware::neuralnetworks::V1_0; 24 | namespace V1_2 = ::android::hardware::neuralnetworks::V1_2; 25 | namespace V1_3 = ::android::hardware::neuralnetworks::V1_3; 26 | 27 | namespace armnn_driver 28 | { 29 | namespace hal_1_3 30 | { 31 | 32 | class ArmnnDriverImpl 33 | { 34 | public: 35 | using HidlToken = android::hardware::hidl_array; 36 | 37 | static Return prepareArmnnModel_1_3( 38 | const armnn::IRuntimePtr& runtime, 39 | const armnn::IGpuAccTunedParametersPtr& clTunedParameters, 40 | const DriverOptions& options, 41 | const V1_3::Model& model, 42 | const android::hardware::hidl_vec& modelCacheHandle, 43 | const android::hardware::hidl_vec& dataCacheHandle, 44 | const HidlToken& token, 45 | const android::sp& cb, 46 | bool float32ToFloat16 = false, 47 | V1_3::Priority priority = V1_3::Priority::MEDIUM); 48 | 49 | static Return prepareModelFromCache_1_3( 50 | const armnn::IRuntimePtr& runtime, 51 | const DriverOptions& options, 52 | const android::hardware::hidl_vec& modelCacheHandle, 53 | const android::hardware::hidl_vec& dataCacheHandle, 54 | const HidlToken& token, 55 | const android::sp& cb); 56 | 57 | static Return getCapabilities_1_3(const armnn::IRuntimePtr& runtime, 58 | V1_3::IDevice::getCapabilities_1_3_cb cb); 59 | }; 60 | 61 | } // namespace hal_1_3 62 | } // namespace armnn_driver -------------------------------------------------------------------------------- /1.3/HalPolicy.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2020-2023 Arm Ltd and Contributors. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include "../ConversionUtils.hpp" 9 | #include "../ConversionUtils_1_2.hpp" 10 | #include "../ConversionUtils_1_3.hpp" 11 | 12 | #include 13 | 14 | #include 15 | 16 | namespace V1_3 = ::android::hardware::neuralnetworks::V1_3; 17 | 18 | namespace armnn_driver 19 | { 20 | namespace hal_1_3 21 | { 22 | 23 | class HalPolicy 24 | { 25 | public: 26 | using Model = V1_3::Model; 27 | using Operand = V1_3::Operand; 28 | using OperandLifeTime = V1_3::OperandLifeTime; 29 | using OperandType = V1_3::OperandType; 30 | using Operation = V1_3::Operation; 31 | using OperationType = V1_3::OperationType; 32 | using ExecutionCallback = V1_3::IExecutionCallback; 33 | using getSupportedOperations_cb = V1_3::IDevice::getSupportedOperations_1_3_cb; 34 | using ErrorStatus = V1_3::ErrorStatus; 35 | 36 | static bool ConvertOperation(const Operation& operation, const Model& model, ConversionData& data); 37 | 38 | private: 39 | static bool ConvertArgMinMax(const Operation& operation, 40 | const Model& model, 41 | ConversionData& data, 42 | armnn::ArgMinMaxFunction argMinMaxFunction); 43 | 44 | static bool ConvertAveragePool2d(const Operation& operation, const Model& model, ConversionData& data); 45 | 46 | static bool ConvertBatchToSpaceNd(const Operation& operation, const Model& model, ConversionData& data); 47 | 48 | static bool ConvertCast(const Operation& operation, const Model& model, ConversionData& data); 49 | 50 | static bool ConvertChannelShuffle(const Operation& operation, const Model& model, ConversionData& data); 51 | 52 | static bool ConvertComparison(const Operation& operation, 53 | const Model& model, 54 | ConversionData& data, 55 | armnn::ComparisonOperation comparisonOperation); 56 | 57 | static bool ConvertConcatenation(const Operation& operation, const Model& model, ConversionData& data); 58 | 59 | static bool ConvertConv2d(const Operation& operation, const Model& model, ConversionData& data); 60 | 61 | 
static bool ConvertDepthToSpace(const Operation& operation, const Model& model, ConversionData& data); 62 | 63 | static bool ConvertDepthwiseConv2d(const Operation& operation, const Model& model, ConversionData& data); 64 | 65 | static bool ConvertDequantize(const Operation& operation, const Model& model, ConversionData& data); 66 | 67 | static bool ConvertElementwiseBinary(const Operation& operation, 68 | const Model& model, 69 | ConversionData& data, 70 | armnn::BinaryOperation binaryOperation); 71 | 72 | static bool ConvertElementwiseUnary(const Operation& operation, 73 | const Model& model, 74 | ConversionData& data, 75 | armnn::UnaryOperation unaryOperation); 76 | 77 | static bool ConvertElu(const Operation& operation, const Model& model, ConversionData& data); 78 | 79 | static bool ConvertExpandDims(const Operation& operation, const Model& model, ConversionData& data); 80 | 81 | static bool ConvertFill(const Operation& operation, const Model& model, ConversionData& data); 82 | 83 | static bool ConvertFloor(const Operation& operation, const Model& model, ConversionData& data); 84 | 85 | static bool ConvertFullyConnected(const Operation& operation, const Model& model, ConversionData& data); 86 | 87 | static bool ConvertGather(const Operation& operation, const Model& model, ConversionData& data); 88 | 89 | static bool ConvertGroupedConv2d(const Operation& operation, const Model& model, ConversionData& data); 90 | 91 | static bool ConvertHardSwish(const Operation& operation, const Model& model, ConversionData& data); 92 | 93 | static bool ConvertInstanceNormalization(const Operation& operation, const Model& model, ConversionData& data); 94 | 95 | static bool ConvertL2Normalization(const Operation& operation, const Model& model, ConversionData& data); 96 | 97 | static bool ConvertL2Pool2d(const Operation& operation, const Model& model, ConversionData& data); 98 | 99 | static bool ConvertLocalResponseNormalization(const Operation& operation, 100 | const Model& 
model, 101 | ConversionData& data); 102 | 103 | static bool ConvertLogicalBinary(const Operation& operation, 104 | const Model& model, 105 | ConversionData& data, 106 | armnn::LogicalBinaryOperation logicalOperation); 107 | 108 | static bool ConvertLogistic(const Operation& operation, const Model& model, ConversionData& data); 109 | 110 | static bool ConvertLogSoftmax(const Operation& operation, const Model& model, ConversionData& data); 111 | 112 | static bool ConvertLstm(const Operation& operation, const Model& model, ConversionData& data); 113 | 114 | static bool ConvertMaxPool2d(const Operation& operation, const Model& model, ConversionData& data); 115 | 116 | static bool ConvertMean(const Operation& operation, const Model& model, ConversionData& data); 117 | 118 | static bool ConvertPad(const Operation& operation, const Model& model, ConversionData& data); 119 | 120 | static bool ConvertPadV2(const Operation& operation, const Model& model, ConversionData& data); 121 | 122 | static bool ConvertPrelu(const Operation& operation, const Model& model, ConversionData& data); 123 | 124 | static bool ConvertQuantize(const Operation& operation, const Model& model, ConversionData& data); 125 | 126 | static bool ConvertQuantizedLstm(const Operation& operation, const Model& model, ConversionData& data); 127 | 128 | static bool ConvertQuantized16BitLstm(const Operation& operation, const Model& model, ConversionData& data); 129 | 130 | static bool ConvertRank(const Operation& operation, const Model& model, ConversionData& data); 131 | 132 | static bool ConvertReduce(const Operation& operation, 133 | const Model& model, 134 | ConversionData& data, 135 | ReduceOperation reduceOperation); 136 | 137 | static bool ConvertReLu(const Operation& operation, const Model& model, ConversionData& data); 138 | 139 | static bool ConvertReLu1(const Operation& operation, const Model& model, ConversionData& data); 140 | 141 | static bool ConvertReLu6(const Operation& operation, const Model& 
model, ConversionData& data); 142 | 143 | static bool ConvertReshape(const Operation& operation, const Model& model, ConversionData& data); 144 | 145 | static bool ConvertResize(const Operation& operation, 146 | const Model& model, 147 | ConversionData& data, 148 | armnn::ResizeMethod resizeMethod); 149 | 150 | static bool ConvertSoftmax(const Operation& operation, const Model& model, ConversionData& data); 151 | 152 | static bool ConvertSpaceToBatchNd(const Operation& operation, const Model& model, ConversionData& data); 153 | 154 | static bool ConvertSpaceToDepth(const Operation& operation, const Model& model, ConversionData& data); 155 | 156 | static bool ConvertSplit(const Operation& operation, const Model& model, ConversionData& data); 157 | 158 | static bool ConvertSqrt(const Operation& operation, const Model& model, ConversionData& data); 159 | 160 | static bool ConvertSqueeze(const Operation& operation, const Model& model, ConversionData& data); 161 | 162 | static bool ConvertStridedSlice(const Operation& operation, const Model& model, ConversionData& data); 163 | 164 | static bool ConvertTanH(const Operation& operation, const Model& model, ConversionData& data); 165 | 166 | static bool ConvertTranspose(const Operation& operation, const Model& model, ConversionData& data); 167 | 168 | static bool ConvertTransposeConv2d(const Operation& operation, const Model& model, ConversionData& data); 169 | 170 | static bool ConvertTile(const Operation& operation, const Model& model, ConversionData& data); 171 | 172 | static bool ConvertUnidirectionalSequenceLstm(const Operation& operation, 173 | const Model& model, 174 | ConversionData& data); 175 | }; 176 | 177 | } // namespace hal_1_3 178 | } // namespace armnn_driver 179 | -------------------------------------------------------------------------------- /Android.bp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 ARM Ltd. All rights reserved. 
// SPDX-License-Identifier: MIT
//

////////////////////////////////////////////
//                                        //
//           flatbuffers libs             //
//                                        //
////////////////////////////////////////////

// Shared build settings for the bundled flatbuffers sources.
cc_defaults {
    name: "libflatbuffers-defaults",
    proprietary: true,
    export_include_dirs: [
        "flatbuffers/",
        "flatbuffers/include",
    ],
    local_include_dirs: [
        "flatbuffers/include",
    ],
    cflags: [
        "-O3",
        "-fexceptions",
        "-Wno-unused-parameter",
        "-DFLATBUFFERS_BUILD_FLATC=1",
    ],
    cppflags: [
        "-std=c++14",
    ],
    rtti: true,
}

// Static library wrapping the flatc compiler sources.
cc_library_static {
    name: "libflatbuffers-framework",
    defaults: ["libflatbuffers-defaults"],
    srcs: [
        "flatbuffers/src/flatc.cpp",
        "flatbuffers/src/flatc_main.cpp",
    ],
}

subdirs = [
    "armnn",
]
--------------------------------------------------------------------------------
/ArmnnDevice.cpp:
--------------------------------------------------------------------------------
//
// Copyright © 2017, 2023 Arm Ltd. All rights reserved.
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #define LOG_TAG "ArmnnDriver" 7 | 8 | #include "ArmnnDevice.hpp" 9 | 10 | #include 11 | 12 | #include 13 | 14 | #include 15 | #include 16 | 17 | using namespace android; 18 | 19 | namespace 20 | { 21 | 22 | std::string GetBackendString(const armnn_driver::DriverOptions& options) 23 | { 24 | std::stringstream backends; 25 | for (auto&& b : options.GetBackends()) 26 | { 27 | backends << b << " "; 28 | } 29 | return backends.str(); 30 | } 31 | 32 | } // anonymous namespace 33 | 34 | namespace armnn_driver 35 | { 36 | 37 | ArmnnDevice::ArmnnDevice(DriverOptions options) 38 | : m_Runtime(nullptr, nullptr) 39 | , m_ClTunedParameters(nullptr) 40 | , m_Options(std::move(options)) 41 | { 42 | ALOGV("ArmnnDevice::ArmnnDevice()"); 43 | 44 | armnn::ConfigureLogging(false, m_Options.IsVerboseLoggingEnabled(), armnn::LogSeverity::Trace); 45 | if (m_Options.IsVerboseLoggingEnabled()) 46 | { 47 | SetMinimumLogSeverity(base::VERBOSE); 48 | } 49 | else 50 | { 51 | SetMinimumLogSeverity(base::INFO); 52 | } 53 | 54 | armnn::IRuntime::CreationOptions runtimeOptions; 55 | 56 | #if defined(ARMCOMPUTECL_ENABLED) 57 | try 58 | { 59 | if (!m_Options.GetClTunedParametersFile().empty()) 60 | { 61 | m_ClTunedParameters = armnn::IGpuAccTunedParameters::Create(m_Options.GetClTunedParametersMode(), 62 | m_Options.GetClTuningLevel()); 63 | try 64 | { 65 | m_ClTunedParameters->Load(m_Options.GetClTunedParametersFile().c_str()); 66 | } 67 | catch (std::exception& error) 68 | { 69 | // This is only a warning because the file won't exist the first time you are generating it. 70 | ALOGW("ArmnnDevice: Failed to load CL tuned parameters file '%s': %s", 71 | m_Options.GetClTunedParametersFile().c_str(), error.what()); 72 | } 73 | runtimeOptions.m_GpuAccTunedParameters = m_ClTunedParameters; 74 | } 75 | } 76 | catch (const armnn::ClRuntimeUnavailableException& error) 77 | { 78 | ALOGE("ArmnnDevice: Failed to setup CL runtime: %s. 
Device will be unavailable.", error.what()); 79 | } 80 | catch (std::exception& error) 81 | { 82 | ALOGE("ArmnnDevice: Unknown exception: %s. Device will be unavailable.", error.what()); 83 | } 84 | #endif 85 | runtimeOptions.m_EnableGpuProfiling = m_Options.IsGpuProfilingEnabled(); 86 | m_Runtime = armnn::IRuntime::Create(runtimeOptions); 87 | 88 | std::vector backends; 89 | 90 | if (m_Runtime) 91 | { 92 | const armnn::BackendIdSet supportedDevices = m_Runtime->GetDeviceSpec().GetSupportedBackends(); 93 | for (auto &backend : m_Options.GetBackends()) 94 | { 95 | if (std::find(supportedDevices.cbegin(), supportedDevices.cend(), backend) == supportedDevices.cend()) 96 | { 97 | ALOGW("ArmnnDevice: Requested unknown backend %s", backend.Get().c_str()); 98 | } 99 | else 100 | { 101 | backends.push_back(backend); 102 | } 103 | } 104 | } 105 | 106 | if (backends.empty()) 107 | { 108 | // No known backend specified 109 | throw armnn::InvalidArgumentException("ArmnnDevice: No known backend specified."); 110 | } 111 | 112 | m_Options.SetBackends(backends); 113 | ALOGV("ArmnnDevice: Created device with the following backends: %s", 114 | GetBackendString(m_Options).c_str()); 115 | } 116 | 117 | } // namespace armnn_driver 118 | -------------------------------------------------------------------------------- /ArmnnDevice.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include "DriverOptions.hpp" 9 | 10 | #include 11 | 12 | namespace armnn_driver 13 | { 14 | 15 | class ArmnnDevice 16 | { 17 | protected: 18 | ArmnnDevice(DriverOptions options); 19 | virtual ~ArmnnDevice() {} 20 | 21 | protected: 22 | armnn::IRuntimePtr m_Runtime; 23 | armnn::IGpuAccTunedParametersPtr m_ClTunedParameters; 24 | DriverOptions m_Options; 25 | }; 26 | 27 | } // namespace armnn_driver 28 | -------------------------------------------------------------------------------- /ArmnnDriver.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include 9 | 10 | #include 11 | 12 | #ifdef ARMNN_ANDROID_NN_V1_3 // Using ::android::hardware::neuralnetworks::V1_3 13 | 14 | #include "1.1/ArmnnDriver.hpp" 15 | #include "1.2/ArmnnDriver.hpp" 16 | #include "1.3/ArmnnDriver.hpp" 17 | 18 | namespace armnn_driver 19 | { 20 | 21 | class ArmnnDriver : public hal_1_3::ArmnnDriver 22 | { 23 | public: 24 | ArmnnDriver(DriverOptions options) 25 | : hal_1_3::ArmnnDriver(std::move(options)) 26 | { 27 | ALOGV("ArmnnDriver::ArmnnDriver()"); 28 | } 29 | ~ArmnnDriver() {} 30 | }; 31 | 32 | } // namespace armnn_driver 33 | #elif ARMNN_ANDROID_NN_V1_2 // Using ::android::hardware::neuralnetworks::V1_2 34 | 35 | #include "1.1/ArmnnDriver.hpp" 36 | #include "1.2/ArmnnDriver.hpp" 37 | 38 | namespace armnn_driver 39 | { 40 | 41 | class ArmnnDriver : public hal_1_2::ArmnnDriver 42 | { 43 | public: 44 | ArmnnDriver(DriverOptions options) 45 | : hal_1_2::ArmnnDriver(std::move(options)) 46 | { 47 | ALOGV("ArmnnDriver::ArmnnDriver()"); 48 | } 49 | ~ArmnnDriver() {} 50 | }; 51 | 52 | } // namespace armnn_driver 53 | #elif ARMNN_ANDROID_NN_V1_1 // Using ::android::hardware::neuralnetworks::V1_1 54 | 55 | #include "1.1/ArmnnDriver.hpp" 56 | 57 | namespace 
armnn_driver 58 | { 59 | 60 | class ArmnnDriver : public hal_1_1::ArmnnDriver 61 | { 62 | public: 63 | ArmnnDriver(DriverOptions options) 64 | : hal_1_1::ArmnnDriver(std::move(options)) 65 | { 66 | ALOGV("ArmnnDriver::ArmnnDriver()"); 67 | } 68 | ~ArmnnDriver() {} 69 | }; 70 | 71 | } // namespace armnn_driver 72 | 73 | #else // Fallback to ::android::hardware::neuralnetworks::V1_0 74 | 75 | #include "1.0/ArmnnDriver.hpp" 76 | 77 | namespace armnn_driver 78 | { 79 | 80 | class ArmnnDriver : public hal_1_0::ArmnnDriver 81 | { 82 | public: 83 | ArmnnDriver(DriverOptions options) 84 | : hal_1_0::ArmnnDriver(std::move(options)) 85 | { 86 | ALOGV("ArmnnDriver::ArmnnDriver()"); 87 | } 88 | ~ArmnnDriver() {} 89 | }; 90 | 91 | } // namespace armnn_driver 92 | 93 | #endif 94 | -------------------------------------------------------------------------------- /ArmnnDriverImpl.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include "DriverOptions.hpp" 9 | 10 | #include 11 | 12 | #ifdef ARMNN_ANDROID_R 13 | using namespace android::nn::hal; 14 | #endif 15 | 16 | #ifdef ARMNN_ANDROID_S 17 | using namespace android::hardware; 18 | #endif 19 | 20 | namespace V1_0 = ::android::hardware::neuralnetworks::V1_0; 21 | namespace V1_1 = ::android::hardware::neuralnetworks::V1_1; 22 | 23 | #ifdef ARMNN_ANDROID_NN_V1_2 // Using ::android::hardware::neuralnetworks::V1_2 24 | namespace V1_2 = ::android::hardware::neuralnetworks::V1_2; 25 | #endif 26 | 27 | #ifdef ARMNN_ANDROID_NN_V1_3 // Using ::android::hardware::neuralnetworks::V1_3 28 | namespace V1_2 = ::android::hardware::neuralnetworks::V1_2; 29 | namespace V1_3 = ::android::hardware::neuralnetworks::V1_3; 30 | #endif 31 | 32 | namespace armnn_driver 33 | { 34 | 35 | template 36 | struct CallbackContext 37 | { 38 | Callback callback; 39 | Context ctx; 40 | }; 41 | 42 | template 43 | class ArmnnDriverImpl 44 | { 45 | public: 46 | using HalModel = typename HalPolicy::Model; 47 | using HalGetSupportedOperations_cb = typename HalPolicy::getSupportedOperations_cb; 48 | using HalErrorStatus = typename HalPolicy::ErrorStatus; 49 | 50 | static Return getSupportedOperations( 51 | const armnn::IRuntimePtr& runtime, 52 | const DriverOptions& options, 53 | const HalModel& model, 54 | HalGetSupportedOperations_cb); 55 | 56 | static Return prepareModel( 57 | const armnn::IRuntimePtr& runtime, 58 | const armnn::IGpuAccTunedParametersPtr& clTunedParameters, 59 | const DriverOptions& options, 60 | const HalModel& model, 61 | const android::sp& cb, 62 | bool float32ToFloat16 = false); 63 | 64 | static Return getStatus(); 65 | 66 | }; 67 | 68 | } // namespace armnn_driver 69 | -------------------------------------------------------------------------------- /ArmnnPreparedModel.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 
Arm Ltd. All rights reserved. 3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include "ArmnnDriver.hpp" 9 | #include "ArmnnDriverImpl.hpp" 10 | #include "RequestThread.hpp" 11 | 12 | #include 13 | #include 14 | 15 | #include 16 | #include 17 | 18 | namespace armnn_driver 19 | { 20 | using armnnExecuteCallback_1_0 = std::function; 21 | 22 | struct ArmnnCallback_1_0 23 | { 24 | armnnExecuteCallback_1_0 callback; 25 | }; 26 | 27 | struct ExecutionContext_1_0 {}; 28 | 29 | using CallbackContext_1_0 = CallbackContext; 30 | 31 | template 32 | class ArmnnPreparedModel : public V1_0::IPreparedModel 33 | { 34 | public: 35 | using HalModel = typename HalVersion::Model; 36 | 37 | ArmnnPreparedModel(armnn::NetworkId networkId, 38 | armnn::IRuntime* runtime, 39 | const HalModel& model, 40 | const std::string& requestInputsAndOutputsDumpDir, 41 | const bool gpuProfilingEnabled, 42 | const bool importEnabled = false, 43 | const bool exportEnabled = false); 44 | 45 | virtual ~ArmnnPreparedModel(); 46 | 47 | virtual Return execute(const V1_0::Request& request, 48 | const ::android::sp& callback) override; 49 | 50 | /// execute the graph prepared from the request 51 | void ExecuteGraph(std::shared_ptr>& pMemPools, 52 | armnn::InputTensors& inputTensors, 53 | armnn::OutputTensors& outputTensors, 54 | CallbackContext_1_0 callback); 55 | 56 | /// Executes this model with dummy inputs (e.g. all zeroes). 
57 | /// \return false on failure, otherwise true 58 | bool ExecuteWithDummyInputs(); 59 | 60 | private: 61 | 62 | template 63 | void DumpTensorsIfRequired(char const* tensorNamePrefix, const TensorBindingCollection& tensorBindings); 64 | 65 | armnn::NetworkId m_NetworkId; 66 | armnn::IRuntime* m_Runtime; 67 | HalModel m_Model; 68 | // There must be a single RequestThread for all ArmnnPreparedModel objects to ensure serial execution of workloads 69 | // It is specific to this class, so it is declared as static here 70 | static RequestThread m_RequestThread; 73 | uint32_t m_RequestCount; 74 | const std::string& m_RequestInputsAndOutputsDumpDir; 75 | const bool m_GpuProfilingEnabled; 76 | const bool m_EnableImport; 77 | const bool m_EnableExport; 78 | }; 79 | 80 | } 81 | -------------------------------------------------------------------------------- /ArmnnPreparedModel_1_2.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include "ArmnnDriver.hpp" 9 | #include "ArmnnDriverImpl.hpp" 10 | #include "RequestThread.hpp" 11 | #include "ModelToINetworkConverter.hpp" 12 | 13 | #include 14 | #include 15 | 16 | #include 17 | #include 18 | 19 | namespace armnn_driver 20 | { 21 | 22 | using CallbackAsync_1_2 = std::function< 23 | void(V1_0::ErrorStatus errorStatus, 24 | std::vector<::android::hardware::neuralnetworks::V1_2::OutputShape> outputShapes, 25 | const ::android::hardware::neuralnetworks::V1_2::Timing& timing, 26 | std::string callingFunction)>; 27 | 28 | struct ExecutionContext_1_2 29 | { 30 | ::android::hardware::neuralnetworks::V1_2::MeasureTiming measureTimings = 31 | ::android::hardware::neuralnetworks::V1_2::MeasureTiming::NO; 32 | TimePoint driverStart; 33 | }; 34 | 35 | using CallbackContext_1_2 = CallbackContext; 36 | 37 | template 38 | class ArmnnPreparedModel_1_2 : public V1_2::IPreparedModel 39 | { 40 | public: 41 | using HalModel = typename V1_2::Model; 42 | 43 | ArmnnPreparedModel_1_2(armnn::NetworkId networkId, 44 | armnn::IRuntime* runtime, 45 | const HalModel& model, 46 | const std::string& requestInputsAndOutputsDumpDir, 47 | const bool gpuProfilingEnabled, 48 | const bool importEnabled = false, 49 | const bool exportEnabled = false); 50 | 51 | ArmnnPreparedModel_1_2(armnn::NetworkId networkId, 52 | armnn::IRuntime* runtime, 53 | const std::string& requestInputsAndOutputsDumpDir, 54 | const bool gpuProfilingEnabled, 55 | const bool importEnabled = false, 56 | const bool exportEnabled = false, 57 | const bool preparedFromCache = false); 58 | 59 | virtual ~ArmnnPreparedModel_1_2(); 60 | 61 | virtual Return execute(const V1_0::Request& request, 62 | const ::android::sp& callback) override; 63 | 64 | virtual Return execute_1_2(const V1_0::Request& request, V1_2::MeasureTiming measure, 65 | const ::android::sp& callback) override; 66 | 67 | virtual Return executeSynchronously(const V1_0::Request 
&request, 68 | V1_2::MeasureTiming measure, 69 | V1_2::IPreparedModel::executeSynchronously_cb cb) override; 70 | 71 | virtual Return configureExecutionBurst( 72 | const ::android::sp& callback, 73 | const android::hardware::MQDescriptorSync& requestChannel, 74 | const android::hardware::MQDescriptorSync& resultChannel, 75 | configureExecutionBurst_cb cb) override; 76 | 77 | /// execute the graph prepared from the request 78 | template 79 | bool ExecuteGraph(std::shared_ptr>& pMemPools, 80 | armnn::InputTensors& inputTensors, 81 | armnn::OutputTensors& outputTensors, 82 | CallbackContext callback); 83 | 84 | /// Executes this model with dummy inputs (e.g. all zeroes). 85 | /// \return false on failure, otherwise true 86 | bool ExecuteWithDummyInputs(unsigned int numInputs, unsigned int numOutputs); 87 | 88 | private: 89 | 90 | Return Execute(const V1_0::Request& request, 91 | V1_2::MeasureTiming measureTiming, 92 | CallbackAsync_1_2 callback); 93 | 94 | Return PrepareMemoryForInputs( 95 | armnn::InputTensors& inputs, 96 | const V1_0::Request& request, 97 | const std::vector& memPools); 98 | 99 | Return PrepareMemoryForOutputs( 100 | armnn::OutputTensors& outputs, 101 | std::vector &outputShapes, 102 | const V1_0::Request& request, 103 | const std::vector& memPools); 104 | 105 | Return PrepareMemoryForIO( 106 | armnn::InputTensors& inputs, 107 | armnn::OutputTensors& outputs, 108 | std::vector& memPools, 109 | const V1_0::Request& request, 110 | CallbackAsync_1_2 callback); 111 | 112 | template 113 | void DumpTensorsIfRequired(char const* tensorNamePrefix, const TensorBindingCollection& tensorBindings); 114 | 115 | armnn::NetworkId m_NetworkId; 116 | armnn::IRuntime* m_Runtime; 117 | V1_2::Model m_Model; 118 | // There must be a single RequestThread for all ArmnnPreparedModel objects to ensure serial execution of workloads 119 | // It is specific to this class, so it is declared as static here 120 | static RequestThread m_RequestThread; 123 | uint32_t 
m_RequestCount; 124 | const std::string& m_RequestInputsAndOutputsDumpDir; 125 | const bool m_GpuProfilingEnabled; 126 | const bool m_EnableImport; 127 | const bool m_EnableExport; 128 | const bool m_PreparedFromCache; 129 | }; 130 | 131 | } 132 | -------------------------------------------------------------------------------- /ArmnnPreparedModel_1_3.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2020 Arm Ltd. All rights reserved. 3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include "ArmnnDriver.hpp" 9 | #include "ArmnnDriverImpl.hpp" 10 | #include "RequestThread_1_3.hpp" 11 | #include "ModelToINetworkConverter.hpp" 12 | 13 | #include 14 | #include 15 | 16 | 17 | #include 18 | #include 19 | 20 | namespace armnn_driver 21 | { 22 | using CallbackAsync_1_3 = std::function< 23 | void(V1_3::ErrorStatus errorStatus, 24 | std::vector<::android::hardware::neuralnetworks::V1_2::OutputShape> outputShapes, 25 | const ::android::hardware::neuralnetworks::V1_2::Timing& timing, 26 | std::string callingFunction)>; 27 | 28 | struct ExecutionContext_1_3 29 | { 30 | ::android::hardware::neuralnetworks::V1_2::MeasureTiming measureTimings = 31 | ::android::hardware::neuralnetworks::V1_2::MeasureTiming::NO; 32 | TimePoint driverStart; 33 | TimePoint driverEnd; 34 | TimePoint deviceStart; 35 | TimePoint deviceEnd; 36 | }; 37 | 38 | using CallbackContext_1_3 = CallbackContext; 39 | 40 | using executeFenced_cb = std::function& callback)>; 43 | 44 | template 45 | class ArmnnPreparedModel_1_3 : public V1_3::IPreparedModel 46 | { 47 | public: 48 | using HalModel = typename V1_3::Model; 49 | 50 | ArmnnPreparedModel_1_3(armnn::NetworkId networkId, 51 | armnn::IRuntime* runtime, 52 | const HalModel& model, 53 | const std::string& requestInputsAndOutputsDumpDir, 54 | const bool gpuProfilingEnabled, 55 | V1_3::Priority priority = V1_3::Priority::MEDIUM, 56 | const bool importEnabled = false, 57 | const 
bool exportEnabled = false); 58 | 59 | ArmnnPreparedModel_1_3(armnn::NetworkId networkId, 60 | armnn::IRuntime* runtime, 61 | const std::string& requestInputsAndOutputsDumpDir, 62 | const bool gpuProfilingEnabled, 63 | V1_3::Priority priority = V1_3::Priority::MEDIUM, 64 | const bool importEnabled = false, 65 | const bool exportEnabled = false, 66 | const bool preparedFromCache = false); 67 | 68 | virtual ~ArmnnPreparedModel_1_3(); 69 | 70 | Return execute(const V1_0::Request& request, 71 | const ::android::sp& callback) override; 72 | 73 | Return execute_1_2(const V1_0::Request& request, V1_2::MeasureTiming measure, 74 | const ::android::sp& callback) override; 75 | 76 | Return execute_1_3(const V1_3::Request& request, 77 | V1_2::MeasureTiming measure, 78 | const V1_3::OptionalTimePoint&, 79 | const V1_3::OptionalTimeoutDuration&, 80 | const ::android::sp& callback) override; 81 | 82 | Return executeSynchronously(const V1_0::Request &request, 83 | V1_2::MeasureTiming measure, 84 | V1_3::IPreparedModel::executeSynchronously_cb cb) override; 85 | 86 | Return executeSynchronously_1_3(const V1_3::Request &request, 87 | V1_2::MeasureTiming measure, 88 | const V1_3::OptionalTimePoint& deadline, 89 | const V1_3::OptionalTimeoutDuration& loopTimeoutDuration, 90 | V1_3::IPreparedModel::executeSynchronously_1_3_cb cb) override; 91 | 92 | Return executeFenced(const V1_3::Request& request, 93 | const android::hardware::hidl_vec& fenceWaitFor, 94 | V1_2::MeasureTiming measure, 95 | const V1_3::OptionalTimePoint& deadline, 96 | const V1_3::OptionalTimeoutDuration& loopTimeoutDuration, 97 | const V1_3::OptionalTimeoutDuration& duration, 98 | executeFenced_cb callback) override; 99 | 100 | Return configureExecutionBurst( 101 | const ::android::sp& callback, 102 | const android::hardware::MQDescriptorSync& requestChannel, 103 | const android::hardware::MQDescriptorSync& resultChannel, 104 | configureExecutionBurst_cb cb) override; 105 | 106 | template 107 | Return 
ExecuteSynchronously(const V1_3::Request& request, CallbackContext cbCtx); 108 | 109 | /// execute the graph prepared from the request 110 | template 111 | Return ExecuteGraph( 112 | std::shared_ptr>& pMemPools, 113 | armnn::InputTensors& inputTensors, 114 | armnn::OutputTensors& outputTensors, 115 | CallbackContext callback); 116 | 117 | /// Executes this model with dummy inputs (e.g. all zeroes). 118 | /// \return false on failure, otherwise true 119 | bool ExecuteWithDummyInputs(unsigned int numInputs, unsigned int numOutputs); 120 | 121 | V1_3::Priority GetModelPriority(); 122 | 123 | private: 124 | 125 | Return Execute(const V1_3::Request& request, 126 | V1_2::MeasureTiming measureTiming, 127 | CallbackAsync_1_3 callback); 128 | 129 | Return PrepareMemoryForInputs( 130 | armnn::InputTensors& inputs, 131 | const V1_3::Request& request, 132 | const std::vector& memPools); 133 | 134 | Return PrepareMemoryForOutputs( 135 | armnn::OutputTensors& outputs, 136 | std::vector &outputShapes, 137 | const V1_3::Request& request, 138 | const std::vector& memPools); 139 | 140 | std::tuple, V1_2::Timing, std::string> PrepareMemoryForIO( 141 | armnn::InputTensors& inputs, 142 | armnn::OutputTensors& outputs, 143 | std::vector& memPools, 144 | const V1_3::Request& request); 145 | 146 | template 147 | void DumpTensorsIfRequired(char const* tensorNamePrefix, const TensorBindingCollection& tensorBindings); 148 | 149 | armnn::NetworkId m_NetworkId; 150 | armnn::IRuntime* m_Runtime; 151 | V1_3::Model m_Model; 152 | // There must be a single RequestThread for all ArmnnPreparedModel objects to ensure serial execution of workloads 153 | // It is specific to this class, so it is declared as static here 154 | static RequestThread_1_3 m_RequestThread; 157 | uint32_t m_RequestCount; 158 | const std::string& m_RequestInputsAndOutputsDumpDir; 159 | const bool m_GpuProfilingEnabled; 160 | V1_3::Priority m_ModelPriority; 161 | 162 | const bool m_EnableImport; 163 | const bool m_EnableExport; 
164 | const bool m_PreparedFromCache; 165 | }; 166 | 167 | } 168 | -------------------------------------------------------------------------------- /CacheDataHandler.cpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2021 Arm Ltd and Contributors. All rights reserved. 3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #include "CacheDataHandler.hpp" 7 | 8 | #include 9 | 10 | namespace armnn_driver 11 | { 12 | 13 | CacheDataHandler& CacheDataHandlerInstance() 14 | { 15 | static CacheDataHandler instance; 16 | return instance; 17 | } 18 | 19 | void CacheDataHandler::Register(const HidlToken token, const size_t hashValue, const size_t cacheSize) 20 | { 21 | if (m_CacheDataMap.find(hashValue) != m_CacheDataMap.end() 22 | && m_CacheDataMap.at(hashValue).GetToken() == token 23 | && m_CacheDataMap.at(hashValue).GetCacheSize() == cacheSize) 24 | { 25 | ALOGV("CacheHandler::Register() Hash value has already registered."); 26 | return; 27 | } 28 | CacheHandle cacheHandle(token, cacheSize); 29 | m_CacheDataMap.insert({hashValue, cacheHandle}); 30 | } 31 | 32 | bool CacheDataHandler::Validate(const HidlToken token, const size_t hashValue, const size_t cacheSize) const 33 | { 34 | return (m_CacheDataMap.find(hashValue) != m_CacheDataMap.end() 35 | && m_CacheDataMap.at(hashValue).GetToken() == token 36 | && m_CacheDataMap.at(hashValue).GetCacheSize() == cacheSize); 37 | } 38 | 39 | size_t CacheDataHandler::Hash(std::vector& cacheData) 40 | { 41 | std::size_t hash = cacheData.size(); 42 | for (auto& i : cacheData) 43 | { 44 | hash = ((hash << 5) - hash) + i; 45 | } 46 | return hash; 47 | } 48 | 49 | size_t CacheDataHandler::GetCacheSize(HidlToken token) 50 | { 51 | for (auto i = m_CacheDataMap.begin(); i != m_CacheDataMap.end(); ++i) 52 | { 53 | if (i->second.GetToken() == token) 54 | { 55 | return i->second.GetCacheSize(); 56 | } 57 | } 58 | return 0; 59 | } 60 | 61 | void CacheDataHandler::Clear() 62 | { 63 | 
m_CacheDataMap.clear(); 64 | } 65 | 66 | } // armnn_driver 67 | -------------------------------------------------------------------------------- /CacheDataHandler.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2021 Arm Ltd and Contributors. All rights reserved. 3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include 9 | 10 | #include 11 | #include 12 | 13 | #include 14 | 15 | namespace armnn_driver 16 | { 17 | 18 | using HidlToken = android::hardware::hidl_array; 19 | 20 | class CacheHandle 21 | { 22 | public: 23 | CacheHandle(const HidlToken token, const size_t cacheSize) 24 | : m_HidlToken(token), m_CacheSize(cacheSize) {} 25 | 26 | ~CacheHandle() {}; 27 | 28 | HidlToken GetToken() const 29 | { 30 | return m_HidlToken; 31 | } 32 | 33 | size_t GetCacheSize() const 34 | { 35 | return m_CacheSize; 36 | } 37 | 38 | private: 39 | const HidlToken m_HidlToken; 40 | const size_t m_CacheSize; 41 | }; 42 | 43 | class CacheDataHandler 44 | { 45 | public: 46 | CacheDataHandler() {} 47 | ~CacheDataHandler() {} 48 | 49 | void Register(const HidlToken token, const size_t hashValue, const size_t cacheSize); 50 | 51 | bool Validate(const HidlToken token, const size_t hashValue, const size_t cacheSize) const; 52 | 53 | size_t Hash(std::vector& cacheData); 54 | 55 | size_t GetCacheSize(HidlToken token); 56 | 57 | void Clear(); 58 | 59 | private: 60 | CacheDataHandler(const CacheDataHandler&) = delete; 61 | CacheDataHandler& operator=(const CacheDataHandler&) = delete; 62 | 63 | std::unordered_map m_CacheDataMap; 64 | }; 65 | 66 | CacheDataHandler& CacheDataHandlerInstance(); 67 | 68 | } // armnn_driver 69 | -------------------------------------------------------------------------------- /ConversionUtils.cpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017,2022 Arm Ltd and Contributors. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #include "ConversionUtils.hpp" 7 | #include 8 | 9 | /// 10 | /// Helper classes 11 | /// 12 | 13 | namespace armnn_driver 14 | { 15 | 16 | LayerInputHandle::LayerInputHandle() 17 | : m_OutputSlot(nullptr) 18 | , m_Valid(false) 19 | {} 20 | 21 | LayerInputHandle::LayerInputHandle(bool valid, armnn::IOutputSlot* outputSlot, armnn::TensorInfo tensorInfo) 22 | : m_OutputSlot(outputSlot) 23 | , m_Valid(valid) 24 | , m_TensorInfo(tensorInfo) 25 | {} 26 | 27 | bool LayerInputHandle::IsValid() const 28 | { 29 | return m_Valid; 30 | } 31 | 32 | void LayerInputHandle::Connect(armnn::IInputSlot& inputSlot) 33 | { 34 | if (!IsValid()) 35 | { 36 | throw armnn::RuntimeException("LayerInputHandle is invalid"); 37 | } 38 | 39 | if (m_OutputSlot) 40 | { 41 | m_OutputSlot->Connect(inputSlot); 42 | } 43 | } 44 | 45 | void LayerInputHandle::Disconnect(armnn::IInputSlot& inputSlot) 46 | { 47 | if (!IsValid()) 48 | { 49 | throw armnn::RuntimeException("LayerInputHandle is invalid"); 50 | } 51 | if (m_OutputSlot) 52 | { 53 | m_OutputSlot->Disconnect(inputSlot); 54 | } 55 | } 56 | 57 | const armnn::TensorInfo& LayerInputHandle::GetTensorInfo() const 58 | { 59 | return m_TensorInfo; 60 | } 61 | 62 | void LayerInputHandle::SanitizeQuantizationScale(LayerInputHandle& weight, 63 | LayerInputHandle& input) 64 | { 65 | if (m_OutputSlot) 66 | { 67 | armnn::TensorInfo weightInfo = weight.GetTensorInfo(); 68 | armnn::TensorInfo inputInfo = input.GetTensorInfo(); 69 | armnn::TensorInfo biasInfo = GetTensorInfo(); 70 | 71 | SanitizeBiasQuantizationScale(biasInfo, weightInfo, inputInfo); 72 | 73 | m_TensorInfo = biasInfo; 74 | m_OutputSlot->SetTensorInfo(biasInfo); 75 | } 76 | } 77 | 78 | ConstTensorPin::ConstTensorPin(bool optional) 79 | : m_Optional(optional) 80 | {} 81 | 82 | ConstTensorPin::ConstTensorPin(armnn::TensorInfo& tensorInfo, 83 | const void* valueStart, 84 | uint32_t numBytes, 85 | const armnn::PermutationVector& mappings) 86 | : 
m_Optional(false) 87 | { 88 | armnn::IgnoreUnused(numBytes); 89 | if (tensorInfo.GetNumBytes() != numBytes) 90 | { 91 | ALOGW("The size of ConstTensor does not match its TensorInfo."); 92 | } 93 | 94 | const bool needsSwizzling = (mappings.GetSize() > 0); 95 | if (needsSwizzling) 96 | { 97 | m_SwizzledTensorData.resize(tensorInfo.GetNumBytes()); 98 | SwizzleAndroidNn4dTensorToArmNn(tensorInfo, valueStart, m_SwizzledTensorData.data(), mappings); 99 | 100 | m_ConstTensor = armnn::ConstTensor(tensorInfo, m_SwizzledTensorData.data()); 101 | } 102 | else 103 | { 104 | m_ConstTensor = armnn::ConstTensor(tensorInfo, valueStart); 105 | } 106 | } 107 | 108 | bool ConstTensorPin::IsValid() const 109 | { 110 | return m_ConstTensor.GetMemoryArea() != nullptr; 111 | } 112 | 113 | bool ConstTensorPin::IsOptional() const 114 | { 115 | return m_Optional; 116 | } 117 | 118 | const armnn::ConstTensor& ConstTensorPin::GetConstTensor() const 119 | { 120 | return m_ConstTensor; 121 | } 122 | 123 | const armnn::ConstTensor* ConstTensorPin::GetConstTensorPtr() const 124 | { 125 | if (IsValid() && m_ConstTensor.GetNumElements() > 0) 126 | { 127 | return &m_ConstTensor; 128 | } 129 | // tensor is either invalid, or has no elements (indicating an optional tensor that was not provided) 130 | return nullptr; 131 | } 132 | 133 | /// 134 | /// Utility functions 135 | /// 136 | 137 | armnn::IConnectableLayer* ProcessActivation(const armnn::TensorInfo& tensorInfo, 138 | ActivationFn activation, 139 | armnn::IConnectableLayer* prevLayer, 140 | ConversionData& data) 141 | { 142 | if (prevLayer->GetNumOutputSlots() != 1) 143 | { 144 | Fail("%s: Incorrect Number of OutputSlots expected 1 was %i", __func__, prevLayer->GetNumOutputSlots()); 145 | return nullptr; 146 | } 147 | prevLayer->GetOutputSlot(0).SetTensorInfo(tensorInfo); 148 | 149 | armnn::IConnectableLayer* activationLayer = prevLayer; 150 | 151 | if (activation != ActivationFn::kActivationNone) 152 | { 153 | armnn::ActivationDescriptor 
activationDesc; 154 | switch (activation) 155 | { 156 | case ActivationFn::kActivationRelu: 157 | { 158 | activationDesc.m_Function = armnn::ActivationFunction::ReLu; 159 | break; 160 | } 161 | case ActivationFn::kActivationRelu1: 162 | { 163 | activationDesc.m_Function = armnn::ActivationFunction::BoundedReLu; 164 | activationDesc.m_A = 1.0f; 165 | activationDesc.m_B = -1.0f; 166 | break; 167 | } 168 | case ActivationFn::kActivationRelu6: 169 | { 170 | activationDesc.m_Function = armnn::ActivationFunction::BoundedReLu; 171 | activationDesc.m_A = 6.0f; 172 | break; 173 | } 174 | case ActivationFn::kActivationSigmoid: 175 | { 176 | activationDesc.m_Function = armnn::ActivationFunction::Sigmoid; 177 | break; 178 | } 179 | case ActivationFn::kActivationTanh: 180 | { 181 | activationDesc.m_Function = armnn::ActivationFunction::TanH; 182 | activationDesc.m_A = 1.0f; 183 | activationDesc.m_B = 1.0f; 184 | break; 185 | } 186 | default: 187 | { 188 | Fail("%s: Invalid activation enum value %i", __func__, activation); 189 | return nullptr; 190 | } 191 | } 192 | 193 | bool isSupported = false; 194 | armnn::BackendId setBackend; 195 | FORWARD_LAYER_SUPPORT_FUNC(__func__, 196 | IsActivationSupported, 197 | data.m_Backends, 198 | isSupported, 199 | setBackend, 200 | prevLayer->GetOutputSlot(0).GetTensorInfo(), 201 | tensorInfo, 202 | activationDesc); 203 | if (!isSupported) 204 | { 205 | return nullptr; 206 | } 207 | 208 | activationLayer = data.m_Network->AddActivationLayer(activationDesc); 209 | activationLayer->SetBackendId(setBackend); 210 | 211 | prevLayer->GetOutputSlot(0).Connect(activationLayer->GetInputSlot(0)); 212 | activationLayer->GetOutputSlot(0).SetTensorInfo(tensorInfo); 213 | } 214 | 215 | return activationLayer; 216 | } 217 | 218 | } // namespace armnn_driver 219 | -------------------------------------------------------------------------------- /DriverOptions.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // 
Copyright © 2017 Arm Ltd. All rights reserved. 3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include 9 | 10 | #include 11 | #include 12 | #include 13 | 14 | namespace armnn_driver 15 | { 16 | 17 | class DriverOptions 18 | { 19 | public: 20 | DriverOptions(armnn::Compute computeDevice, bool fp16Enabled = false); 21 | DriverOptions(const std::vector& backends, bool fp16Enabled); 22 | DriverOptions(int argc, char** argv); 23 | DriverOptions(DriverOptions&& other) = default; 24 | 25 | const std::vector& GetBackends() const { return m_Backends; } 26 | bool IsVerboseLoggingEnabled() const { return m_VerboseLogging; } 27 | const std::string& GetRequestInputsAndOutputsDumpDir() const { return m_RequestInputsAndOutputsDumpDir; } 28 | const std::string& GetServiceName() const { return m_ServiceName; } 29 | const std::set& GetForcedUnsupportedOperations() const { return m_ForcedUnsupportedOperations; } 30 | const std::string& GetClTunedParametersFile() const { return m_ClTunedParametersFile; } 31 | const std::string& GetClMLGOTunedParametersFile() const { return m_ClMLGOTunedParametersFile; } 32 | armnn::IGpuAccTunedParameters::Mode GetClTunedParametersMode() const { return m_ClTunedParametersMode; } 33 | armnn::IGpuAccTunedParameters::TuningLevel GetClTuningLevel() const { return m_ClTuningLevel; } 34 | bool IsGpuProfilingEnabled() const { return m_EnableGpuProfiling; } 35 | bool IsFastMathEnabled() const { return m_FastMathEnabled; } 36 | bool GetFp16Enabled() const { return m_fp16Enabled; } 37 | void SetBackends(const std::vector& backends) { m_Backends = backends; } 38 | bool ShouldExit() const { return m_ShouldExit; } 39 | int GetExitCode() const { return m_ExitCode; } 40 | const std::string& GetCachedNetworkFilePath() const { return m_CachedNetworkFilePath; } 41 | bool SaveCachedNetwork() const { return m_SaveCachedNetwork; } 42 | unsigned int GetNumberOfThreads() const { return m_NumberOfThreads; } 43 | bool isImportEnabled() const { return 
m_EnableImport; }; 44 | bool isExportEnabled() const { return m_EnableExport; }; 45 | 46 | private: 47 | std::vector m_Backends; 48 | bool m_VerboseLogging; 49 | std::string m_RequestInputsAndOutputsDumpDir; 50 | std::string m_ServiceName; 51 | std::set m_ForcedUnsupportedOperations; 52 | std::string m_ClTunedParametersFile; 53 | std::string m_ClMLGOTunedParametersFile; 54 | armnn::IGpuAccTunedParameters::Mode m_ClTunedParametersMode; 55 | armnn::IGpuAccTunedParameters::TuningLevel m_ClTuningLevel; 56 | bool m_EnableGpuProfiling; 57 | bool m_fp16Enabled; 58 | bool m_FastMathEnabled; 59 | bool m_ShouldExit; 60 | int m_ExitCode; 61 | std::string m_CachedNetworkFilePath; 62 | bool m_SaveCachedNetwork; 63 | unsigned int m_NumberOfThreads; 64 | bool m_EnableImport; 65 | bool m_EnableExport; 66 | }; 67 | 68 | } // namespace armnn_driver 69 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2017 ARM Limited. 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 22 | -------------------------------------------------------------------------------- /LICENSES/MIT.txt: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: 6 | 7 | The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. 8 | 9 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 10 | -------------------------------------------------------------------------------- /ModelToINetworkConverter.hpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd. All rights reserved. 
3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #pragma once 7 | 8 | #include "ArmnnDriver.hpp" 9 | #include "ConversionUtils.hpp" 10 | 11 | #include 12 | 13 | #include 14 | #include 15 | 16 | namespace armnn_driver 17 | { 18 | 19 | enum class ConversionResult 20 | { 21 | Success, 22 | ErrorMappingPools, 23 | UnsupportedFeature 24 | }; 25 | 26 | // A helper template class performing the conversion from an AndroidNN driver Model representation, 27 | // to an armnn::INetwork object 28 | template 29 | class ModelToINetworkConverter 30 | { 31 | public: 32 | using HalModel = typename HalPolicy::Model; 33 | 34 | ModelToINetworkConverter(const std::vector& backends, 35 | const HalModel& model, 36 | const std::set& forcedUnsupportedOperations); 37 | 38 | ConversionResult GetConversionResult() const { return m_ConversionResult; } 39 | 40 | // Returns the ArmNN INetwork corresponding to the input model, if preparation went smoothly, nullptr otherwise. 41 | armnn::INetwork* GetINetwork() const { return m_Data.m_Network.get(); } 42 | 43 | bool IsOperationSupported(uint32_t operationIndex) const; 44 | 45 | private: 46 | void Convert(); 47 | 48 | // Shared aggregate input/output/internal data 49 | ConversionData m_Data; 50 | 51 | // Input data 52 | const HalModel& m_Model; 53 | const std::set& m_ForcedUnsupportedOperations; 54 | 55 | // Output data 56 | ConversionResult m_ConversionResult; 57 | std::map m_OperationSupported; 58 | }; 59 | 60 | } // armnn_driver 61 | -------------------------------------------------------------------------------- /NnapiSupport.txt: -------------------------------------------------------------------------------- 1 | ------ ArmNN for Android NNAPI supported operations ------ 2 | 3 | This release of ArmNN for Android supports use as a driver for the Android Neural Networks API. 
It implements the 4 | android.hardware.neuralnetworks@1.0, android.hardware.neuralnetworks@1.1, android.hardware.neuralnetworks@1.2 and 5 | android.hardware.neuralnetworks@1.3 6 | HAL interfaces. 7 | 8 | For more information on the Android Neural Networks API, see https://developer.android.com/ndk/guides/neuralnetworks/index.html 9 | 10 | For integration and usage documentation, please see README.md. 11 | 12 | --- Support for Android Neural Networks HAL operations --- 13 | 14 | The following AndroidNN HAL 1.0, 1.1, 1.2 and 1.3 operations are currently supported: 15 | 16 | AndroidNN operator Tensor type supported 17 | ABS (FLOAT32, FLOAT16, INT32) 18 | ADD (FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 19 | ARGMAX (FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 20 | ARGMIN (FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 21 | AVERAGE_POOL_2D (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 22 | BATCH_TO_SPACE_ND (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 23 | CAST (FLOAT32, FLOAT16, INT32, QUANT8_ASYMM) 24 | CHANNEL_SHUFFLE (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 25 | CONCATENATION (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 26 | CONV_2D (FLOAT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 27 | DEPTH_TO_SPACE (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 28 | DEPTHWISE_CONV_2D (FLOAT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 29 | DEQUANTIZE (FLOAT32 (output only), QUANT8_ASYMM and QUANT8_ASYMM_SIGNED (input only)) 30 | DIV (FLOAT32, FLOAT16, INT32) 31 | ELU (FLOAT32, FLOAT16, QUANT8_ASYMM) 32 | EQUAL (BOOL8, FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 33 | EXP (FLOAT32, FLOAT16) 34 | EXPAND_DIMS (FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 35 | FILL (FLOAT32, FLOAT16, INT32) 36 | FLOOR (FLOAT32, FLOAT16) 37 | FULLY_CONNECTED (FLOAT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 38 | GATHER (FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 39 | GREATER (BOOL8, 
FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 40 | GREATER_EQUAL (BOOL8, FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 41 | GROUPED_CONV_2D (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 42 | HARD_SWISH (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 43 | INSTANCE_NORMALIZATION (FLOAT32, FLOAT16) 44 | L2_NORMALIZATION (FLOAT32) 45 | L2_POOL_2D (FLOAT32, FLOAT16) 46 | LESS (BOOL8, FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 47 | LESS_EQUAL (BOOL8, FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 48 | LOCAL_RESPONSE_NORMALIZATION (FLOAT32) 49 | LOG (FLOAT32, FLOAT16) 50 | LOGICAL_AND (BOOL8) 51 | LOGICAL_NOT (BOOL8) 52 | LOGICAL_OR (BOOL8) 53 | LOGISTIC (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 54 | LOG_SOFTMAX (FLOAT32, FLOAT16) 55 | LSTM (FLOAT32) 56 | MAXIMUM (FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 57 | MAX_POOL_2D (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 58 | MEAN (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 59 | MINIMUM (FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 60 | MUL (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 61 | NEG (FLOAT32, FLOAT16) 62 | NOT_EQUAL (BOOL8, FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 63 | PAD (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 64 | PAD_V2 (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 65 | POW (FLOAT32, FLOAT16) 66 | PRELU (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 67 | QUANTIZE (FLOAT32 (input only), QUANT8_ASYMM and QUANT8_ASYMM_SIGNED (output only)) 68 | QUANTIZED_16BIT_LSTM (QUANT8_ASYMM) 69 | QUANTIZED_LSTM (QUANT8_ASYMM) 70 | RANK (FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 71 | REDUCE_MAX (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 72 | REDUCE_MIN (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 73 | REDUCE_PROD (FLOAT32, FLOAT16) 74 | REDUCE_SUM (FLOAT32, FLOAT16) 75 | RELU (FLOAT32, FLOAT16, 
QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 76 | RELU1 (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 77 | RELU6 (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 78 | RESHAPE (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 79 | RESIZE_BILINEAR (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 80 | RESIZE_NEAREST_NEIGHBOR (FLOAT32, FLOAT16, QUANT8_ASYMM) 81 | RSQRT (FLOAT32, FLOAT16) 82 | SIN (FLOAT32, FLOAT16) 83 | SOFTMAX (FLOAT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 84 | SPACE_TO_BATCH_ND (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 85 | SPACE_TO_DEPTH (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 86 | SPLIT (FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 87 | SQRT (FLOAT32, FLOAT16) 88 | SQUEEZE (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 89 | STRIDED_SLICE (FLOAT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 90 | SUB (FLOAT32, FLOAT16, INT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 91 | TANH (FLOAT32, FLOAT16, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 92 | TILE (All data types) 93 | TRANSPOSE (FLOAT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 94 | TRANSPOSE_CONV_2D (FLOAT32, QUANT8_ASYMM, QUANT8_ASYMM_SIGNED) 95 | UNIDIRECTIONAL_SEQUENCE_LSTM (FLOAT32, FLOAT16) 96 | 97 | Where operations are not supported by the ArmNN Android NN Driver, the driver indicates this to the framework 98 | appropriately and the framework implements those operations using a CPU implementation. 99 | 100 | NOTE: By convention, only those tensor types have been listed above, which are fully supported across all 101 | ArmNN backends. 102 | - FLOAT16 input tensors are partially supported on most HAL 1.2 and 1.3 operators on the GpuAcc and 103 | CpuRef backends, however not on CpuAcc. 104 | -------------------------------------------------------------------------------- /NnapiSupport.txt.license: -------------------------------------------------------------------------------- 1 | # 2 | # Copyright © 2018-2022 Arm Ltd and Contributors. All rights reserved. 
3 | # SPDX-License-Identifier: MIT 4 | # 5 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # Arm NN Android Neural Networks driver 2 | 3 | This directory contains the Arm NN driver for the Android Neural Networks API, implementing the HIDL based android.hardware.neuralnetworks@1.0, android.hardware.neuralnetworks@1.1, android.hardware.neuralnetworks@1.2 and android.hardware.neuralnetworks@1.3 HALs. 4 | 5 | For Android 11 and lower, the NNAPI uses HIDL based HALs. 6 | 7 | For Android 12 and Android 13, the NNAPI HAL revision uses AIDL instead of HIDL, and HIDL is deprecated. 8 | 9 | For Android 14 the compatibility matrix no longer includes support for HIDL HAL revisions: 10 | https://android.googlesource.com/platform/hardware/interfaces/+/refs/heads/android14-qpr1-release/compatibility_matrices/compatibility_matrix.8.xml 11 | 12 | For more information about supported operations and configurations, see [NnapiSupport.txt](NnapiSupport.txt) 13 | 14 | For documentation about integrating this driver into an Android tree, see [Integrator Guide](docs/IntegratorGuide.md) 15 | 16 | For FAQs and troubleshooting advice, see [FAQ.md](docs/FAQ.md) 17 | 18 | ### License 19 | 20 | The android-nn-driver is provided under the [MIT](https://spdx.org/licenses/MIT.html) license. 21 | See [LICENSE](LICENSE) for more information. Contributions to this project are accepted under the same license. 22 | 23 | Individual files contain the following tag instead of the full license text. 
24 | 25 | SPDX-License-Identifier: MIT 26 | 27 | This enables machine processing of license information based on the SPDX License Identifiers that are available here: http://spdx.org/licenses/ 28 | -------------------------------------------------------------------------------- /README.md.license: -------------------------------------------------------------------------------- 1 | # 2 | # Copyright © 2018-2021 Arm Ltd and Contributors. All rights reserved. 3 | # SPDX-License-Identifier: MIT 4 | # 5 | -------------------------------------------------------------------------------- /RequestThread.cpp: -------------------------------------------------------------------------------- 1 | // 2 | // Copyright © 2017 Arm Ltd and Contributors. All rights reserved. 3 | // SPDX-License-Identifier: MIT 4 | // 5 | 6 | #define LOG_TAG "ArmnnDriver" 7 | 8 | #include "RequestThread.hpp" 9 | #include "ArmnnPreparedModel.hpp" 10 | 11 | #ifdef ARMNN_ANDROID_NN_V1_2 12 | #include "ArmnnPreparedModel_1_2.hpp" 13 | #endif 14 | 15 | #ifdef ARMNN_ANDROID_NN_V1_3 16 | #include "ArmnnPreparedModel_1_2.hpp" 17 | #include "ArmnnPreparedModel_1_3.hpp" 18 | #endif 19 | 20 | #include 21 | 22 | using namespace android; 23 | 24 | namespace armnn_driver 25 | { 26 | 27 | template