#include "HybridTfliteModel.hpp" #include "TfliteHelpers.hpp" #include #include #include #if defined(ANDROID) #include #elif defined(__APPLE__) #include #else #error "Invalid Platform!" #endif namespace margelo::nitro::tflite { HybridTfliteModel::HybridTfliteModel(TfLiteInterpreter* interpreter, std::shared_ptr modelData, std::vector delegates) : HybridObject(TAG), _interpreter(interpreter), _delegates(std::move(delegates)), _modelData(modelData) { TfLiteStatus status = TfLiteInterpreterAllocateTensors(_interpreter); if (status != kTfLiteOk) { throw std::runtime_error( "TFLite: Failed to allocate memory for input/output tensors! Status: " + tfLiteStatusToString(status)); } } HybridTfliteModel::~HybridTfliteModel() { if (_interpreter != nullptr) { TfLiteInterpreterDelete(_interpreter); _interpreter = nullptr; } // _modelData (shared_ptr) is automatically freed } std::vector HybridTfliteModel::getDelegates() { return _delegates; } std::vector HybridTfliteModel::getInputs() { int count = TfLiteInterpreterGetInputTensorCount(_interpreter); std::vector tensors; tensors.reserve(count); for (int32_t i = 0; i < count; i++) { TfLiteTensor* tensor = TfLiteInterpreterGetInputTensor(_interpreter, i); if (tensor == nullptr) { throw std::runtime_error("TFLite: Failed to get input tensor " + std::to_string(i) + "!"); } int dimensions = TfLiteTensorNumDims(tensor); std::vector shape; shape.reserve(dimensions); for (int32_t d = 0; d < dimensions; d++) { int32_t size = TfLiteTensorDim(tensor, d); shape.push_back(static_cast(size)); } tensors.push_back(Tensor(std::string(TfLiteTensorName(tensor)), getTensorDataType(TfLiteTensorType(tensor)), std::move(shape))); } return tensors; } std::vector HybridTfliteModel::getOutputs() { int count = TfLiteInterpreterGetOutputTensorCount(_interpreter); std::vector tensors; tensors.reserve(count); for (int32_t i = 0; i < count; i++) { const TfLiteTensor* tensor = TfLiteInterpreterGetOutputTensor(_interpreter, i); if (tensor == nullptr) { throw std::runtime_error("TFLite: Failed to get output tensor " + std::to_string(i) + "!"); } int dimensions = TfLiteTensorNumDims(tensor); std::vector shape; shape.reserve(dimensions); for (int32_t d = 0; d < dimensions; d++) { int32_t size = TfLiteTensorDim(tensor, d); shape.push_back(static_cast(size)); } tensors.push_back(Tensor(std::string(TfLiteTensorName(tensor)), getTensorDataType(TfLiteTensorType(tensor)), std::move(shape))); } return tensors; } void HybridTfliteModel::copyInputBuffers(const std::vector>& input) { size_t inputCount = TfLiteInterpreterGetInputTensorCount(_interpreter); if (input.size() != inputCount) [[unlikely]] { throw std::runtime_error("TFLite: Input array size (" + std::to_string(input.size()) + ") does not match input tensor count (" + std::to_string(inputCount) + ")!"); } for (int32_t i = 0; i < inputCount; i++) { TfLiteTensor* tensor = TfLiteInterpreterGetInputTensor(_interpreter, i); const std::shared_ptr& buffer = input[i]; TfLiteTensorCopyFromBuffer(tensor, buffer->data(), buffer->size()); } } // Pre-allocates a buffer per output tensor, reuses on subsequent calls. std::shared_ptr HybridTfliteModel::getOutputBufferForTensor(const TfLiteTensor* tensor) { std::string name = TfLiteTensorName(tensor); if (_outputBuffers.find(name) == _outputBuffers.end()) { TfLiteType dataType = TfLiteTensorType(tensor); int totalLength = getTensorTotalLength(tensor); size_t byteSize = totalLength * getTFLTensorDataTypeSize(dataType); _outputBuffers[name] = ArrayBuffer::allocate(byteSize); } return _outputBuffers[name]; } std::vector> HybridTfliteModel::copyOutputBuffers() { int outputCount = TfLiteInterpreterGetOutputTensorCount(_interpreter); std::vector> results; results.reserve(outputCount); for (int32_t i = 0; i < outputCount; i++) { const TfLiteTensor* tensor = TfLiteInterpreterGetOutputTensor(_interpreter, i); std::shared_ptr outputBuffer = getOutputBufferForTensor(tensor); std::string name = TfLiteTensorName(tensor); void* tensorData = TfLiteTensorData(tensor); if (tensorData == nullptr) { [[unlikely]]; throw std::runtime_error("TFLite: Failed to get data from tensor \"" + name + "\"!"); } memcpy(outputBuffer->data(), tensorData, outputBuffer->size()); results.push_back(outputBuffer); } return results; } void HybridTfliteModel::invoke() { TfLiteStatus status = TfLiteInterpreterInvoke(_interpreter); if (status != kTfLiteOk) { throw std::runtime_error("TFLite: Failed to run TFLite Model! Status: " + tfLiteStatusToString(status)); } } std::vector> HybridTfliteModel::runSync(const std::vector>& input) { copyInputBuffers(input); invoke(); return copyOutputBuffers(); } std::shared_ptr>>> HybridTfliteModel::run(const std::vector>& input) { // Copy input buffers on caller (JS) thread first — input ArrayBuffers are // non-owning JS buffers that may be GC'd if we access them async. copyInputBuffers(input); std::shared_ptr sharedThis = shared_cast(); return Promise>>::async( [sharedThis]() -> std::vector> { sharedThis->invoke(); return sharedThis->copyOutputBuffers(); }); } } // namespace margelo::nitro::tflite