/*
* Copyright (C) 2017 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef ANDROID_ML_NN_RUNTIME_MANAGER_H
#define ANDROID_ML_NN_RUNTIME_MANAGER_H
#include "HalInterfaces.h"
#include "Utils.h"
#include "VersionedIDevice.h"
#include <android-base/macros.h>
#include <map>
#include <unordered_set>
#include <vector>
namespace android {
namespace nn {
class ModelBuilder;
class Device {
DISALLOW_IMPLICIT_CONSTRUCTORS(Device);
public:
Device(std::string name, const sp<V1_0::IDevice>& device);
VersionedIDevice* getInterface() { return &mInterface; }
const std::string& getName() const { return mName; }
// Returns true if succesfully initialized.
bool initialize();
void getSupportedOperations(const Model& hidlModel, hidl_vec<bool>* supportedOperations);
PerformanceInfo getFloat32Performance() const { return mFloat32Performance; }
PerformanceInfo getQuantized8Performance() const { return mQuantized8Performance; }
PerformanceInfo getRelaxedFloat32toFloat16Performance() const {
return mRelaxedFloat32toFloat16Performance;
}
private:
std::string mName;
VersionedIDevice mInterface;
PerformanceInfo mFloat32Performance;
PerformanceInfo mQuantized8Performance;
PerformanceInfo mRelaxedFloat32toFloat16Performance;
#ifdef NN_DEBUGGABLE
// For debugging: behavior of IDevice::getSupportedOperations for SampleDriver.
// 0 - all operations reported by IDevice::getSupportedOperations() supported
// 1 - some operations reported by IDevice::getSupportedOperations() supported
uint32_t mSupported = 0;
#endif // NN_DEBUGGABLE
};
// Manages the NN HAL devices. Only one instance of this class will exist.
// Use get() to retrieve it.
class DeviceManager {
public:
const std::vector<std::shared_ptr<Device>>& getDrivers() const {
if (mSetCpuOnly || mDebugNNCpuOnly) {
return mNoDevices;
}
return mDevices;
}
// For testing only:
void setUseCpuOnly(bool useCpuOnly) { mSetCpuOnly = useCpuOnly; }
// How to handle graph partitioning?
// 0 - Don't do graph partitioning.
// 1 - Do graph partitioning; but fall back to non-partitioned
// execution if there is a partitioning failure.
// 2 - Do graph partitioning, and rely on it; there is no fallback.
enum {
kPartitioningNo = 0,
kPartitioningWithFallback = 1,
kPartitioningWithoutFallback = 2
};
uint32_t getPartitioning() const { return mPartitioning; }
static bool partitioningAllowsFallback(uint32_t partitioning) {
return partitioning == kPartitioningWithFallback;
}
// Returns the singleton manager.
static DeviceManager* get();
private:
// Builds the list of available drivers and queries their capabilities.
DeviceManager();
// Adds a device for the manager to use.
void registerDevice(const char* name, const sp<V1_0::IDevice>& device);
void findAvailableDevices();
// List of all the devices we discovered.
std::vector<std::shared_ptr<Device>> mDevices;
// We leave this one always empty. To be used when mUseCpuOnly is true.
std::vector<std::shared_ptr<Device>> mNoDevices;
// If either of these is true, we'll ignore the drivers that are
// on the device and run everything on the CPU.
bool mSetCpuOnly = false; // set by setUseCpuOnly()
bool mDebugNNCpuOnly = false; // derived from system property debug.nn.cpuonly
static const uint32_t kPartitioningDefault = kPartitioningWithFallback;
uint32_t mPartitioning = kPartitioningDefault;
};
} // namespace nn
} // namespace android
#endif // ANDROID_ML_NN_RUNTIME_MANAGER_H