jyoung/selfdrive/modeld/runners/snpemodel.cc

#pragma clang diagnostic ignored "-Wexceptions"

#include "selfdrive/modeld/runners/snpemodel.h"

#include <cstring>
#include <memory>
#include <string>
#include <utility>
#include <vector>

#include "common/util.h"
#include "common/timing.h"

// Writes SNPE's most recent error string to stderr, then terminates the
// process with EXIT_FAILURE. Does not return to the caller.
void PrintErrorStringAndExit() {
  const auto last_error = zdl::DlSystem::getLastErrorString();
  std::cerr << last_error << std::endl;
  std::exit(EXIT_FAILURE);
}

// Builds an SNPE network from the model file at `path` and binds `_output`
// as the user buffer for the network's single output tensor.
//
//   path         - model file; its contents are read into model_data
//   _output      - caller-owned float buffer that receives the network output
//   _output_size - expected output element count; 0 means "take it from the model"
//   runtime      - USE_GPU_RUNTIME / USE_DSP_RUNTIME, anything else selects CPU
//                  (only consulted when QCOM2 is defined)
//   _use_tf8     - stored in use_tf8, which addInput() consults
//   context      - not used by this constructor
//
// Exits the process if the model container cannot be opened. Throws
// std::runtime_error if the output tensor names or buffer attributes cannot be
// obtained, or if the output tensor has fewer than two dimensions.
SNPEModel::SNPEModel(const std::string path, float *_output, size_t _output_size, int runtime, bool _use_tf8, cl_context context) {
  output = _output;
  output_size = _output_size;
  use_tf8 = _use_tf8;

#ifdef QCOM2
  if (runtime == USE_GPU_RUNTIME) {
    snpe_runtime = zdl::DlSystem::Runtime_t::GPU;
  } else if (runtime == USE_DSP_RUNTIME) {
    snpe_runtime = zdl::DlSystem::Runtime_t::DSP;
  } else {
    snpe_runtime = zdl::DlSystem::Runtime_t::CPU;
  }
  assert(zdl::SNPE::SNPEFactory::isRuntimeAvailable(snpe_runtime));
#endif
  model_data = util::read_file(path);
  assert(model_data.size() > 0);

  // load model
  std::unique_ptr<zdl::DlContainer::IDlContainer> container = zdl::DlContainer::IDlContainer::open((uint8_t*)model_data.data(), model_data.size());
  if (!container) { PrintErrorStringAndExit(); }
  LOGW("loaded model with size: %lu", model_data.size());

  // create model runner
  // NOTE(review): a failed build is retried forever with no delay or attempt
  // limit; presumably this rides out transient runtime start-up failures --
  // confirm this is intended.
  zdl::SNPE::SNPEBuilder snpe_builder(container.get());
  while (!snpe) {
#ifdef QCOM2
    snpe = snpe_builder.setOutputLayers({})
                       .setRuntimeProcessor(snpe_runtime)
                       .setUseUserSuppliedBuffers(true)
                       .setPerformanceProfile(zdl::DlSystem::PerformanceProfile_t::HIGH_PERFORMANCE)
                       .build();
#else
    snpe = snpe_builder.setOutputLayers({})
                       .setUseUserSuppliedBuffers(true)
                       .setPerformanceProfile(zdl::DlSystem::PerformanceProfile_t::HIGH_PERFORMANCE)
                       .build();
#endif
    if (!snpe) std::cerr << zdl::DlSystem::getLastErrorString() << std::endl;
  }

  // create output buffer
  zdl::DlSystem::UserBufferEncodingFloat ub_encoding_float;
  zdl::DlSystem::IUserBufferFactory &ub_factory = zdl::SNPE::SNPEFactory::getUserBufferFactory();

  const auto &output_tensor_names_opt = snpe->getOutputTensorNames();
  if (!output_tensor_names_opt) throw std::runtime_error("Error obtaining output tensor names");
  const auto &output_tensor_names = *output_tensor_names_opt;
  assert(output_tensor_names.size() == 1);
  const char *output_tensor_name = output_tensor_names.at(0);

  // Keep the attributes handle in a named local: it is checked before use and
  // stays alive for as long as buffer_shape is read.
  auto output_attrs_opt = snpe->getInputOutputBufferAttributes(output_tensor_name);
  if (!output_attrs_opt) throw std::runtime_error("Error obtaining output buffer attributes");
  const zdl::DlSystem::TensorShape &buffer_shape = (*output_attrs_opt)->getDims();

  // The element count is read from dimension 1, so the tensor needs rank >= 2.
  if (buffer_shape.rank() < 2) throw std::runtime_error("Output tensor must have at least two dimensions");
  if (output_size != 0) {
    assert(output_size == buffer_shape[1]);
  } else {
    output_size = buffer_shape[1];
  }

  // Strides are in bytes: one full row of floats, then one float.
  std::vector<size_t> output_strides = {output_size * sizeof(float), sizeof(float)};
  output_buffer = ub_factory.createUserBuffer(output, output_size * sizeof(float), output_strides, &ub_encoding_float);
  output_map.add(output_tensor_name, output_buffer.get());
}

// Binds the caller-owned `buffer` to the network's next input tensor.
//
// Inputs are matched to tensors by call order: the index used to look up the
// tensor name is the number of inputs registered so far.
//
//   name   - label stored on the created SNPEModelInput
//   buffer - caller-owned memory handed to SNPE as a user buffer
//   size   - forwarded unchanged to SNPEModelInput
//
// Throws std::runtime_error if the input tensor names or the tensor's
// dimensions cannot be obtained, if more inputs are added than the network
// has input tensors, or if the tensor has rank 0.
void SNPEModel::addInput(const std::string name, float *buffer, int size) {
  const int idx = inputs.size();
  const auto &input_tensor_names_opt = snpe->getInputTensorNames();
  if (!input_tensor_names_opt) throw std::runtime_error("Error obtaining input tensor names");
  const auto &input_tensor_names = *input_tensor_names_opt;
  if (static_cast<size_t>(idx) >= input_tensor_names.size()) {
    throw std::runtime_error("Too many inputs added for model input '" + name + "'");
  }
  const char *input_tensor_name = input_tensor_names.at(idx);
  const bool input_tf8 = use_tf8 && strcmp(input_tensor_name, "input_img") == 0;  // TODO: This is a terrible hack, get rid of this name check both here and in onnx_runner.py
  LOGW("adding index %d: %s", idx, input_tensor_name);

  zdl::DlSystem::UserBufferEncodingFloat ub_encoding_float;
  zdl::DlSystem::UserBufferEncodingTf8 ub_encoding_tf8(0, 1./255); // network takes 0-1
  zdl::DlSystem::IUserBufferFactory &ub_factory = zdl::SNPE::SNPEFactory::getUserBufferFactory();
  zdl::DlSystem::UserBufferEncoding *input_encoding = &ub_encoding_float;
  if (input_tf8) {
    input_encoding = &ub_encoding_tf8;
  }

  const auto &buffer_shape_opt = snpe->getInputDimensions(input_tensor_name);
  if (!buffer_shape_opt) throw std::runtime_error("Error obtaining input tensor dimensions");
  const zdl::DlSystem::TensorShape &buffer_shape = *buffer_shape_opt;
  const size_t rank = buffer_shape.rank();
  // A rank-0 shape would make the index arithmetic below wrap around.
  if (rank == 0) throw std::runtime_error("Input tensor has no dimensions");

  const size_t size_of_input = input_tf8 ? sizeof(uint8_t) : sizeof(float);

  // Byte strides, innermost dimension last: the last stride is one element and
  // each earlier stride is the next stride times that dimension's extent.
  // Once every dimension has been folded in, the running value is the total
  // buffer size in bytes.
  std::vector<size_t> strides(rank);
  size_t running_bytes = size_of_input;
  for (size_t i = rank; i-- > 0;) {
    strides[i] = running_bytes;
    running_bytes *= buffer_shape[i];
  }

  auto input_buffer = ub_factory.createUserBuffer(buffer, running_bytes, strides, input_encoding);
  // Register the raw pointer before ownership of the buffer moves into `inputs`.
  input_map.add(input_tensor_name, input_buffer.get());
  inputs.push_back(std::make_unique<SNPEModelInput>(name, buffer, size, std::move(input_buffer)));
}

// Runs the network once using the buffers registered in input_map and
// output_map. If SNPE reports failure, the error string is printed and the
// process exits.
void SNPEModel::execute() {
  const bool succeeded = snpe->execute(input_map, output_map);
  if (succeeded) {
    return;
  }
  PrintErrorStringAndExit();
}
-Werror (#1567) * werror * -Wno-inconsistent-missing-override * Silence ffmpeg deprecation warnings * add some more pragmas to ignore warnings Co-authored-by: Comma Device <device@comma.ai> 6 years ago			`#pragma clang diagnostic ignored "-Wexceptions"`

Cleanup selfdrive/ includes (#20822) * cleanup include path * continue * format includes * fix testraw.cc * remove include path from SConstruct * regroup * rebase master * almost done * apply review * rename FileReader.xx to filereader.xx * rename Unlogger.x->unlogger.x * rename FrameReader.xx -> framereader.xx * apply reviews * ui.h * continue * fix framebuffer.cc build error:mv util.h up * full path to msm_media_info * fix qcom2 camerad Co-authored-by: Comma Device <device@comma.ai> 5 years ago			`#include "selfdrive/modeld/runners/snpemodel.h"`

Use C++ header files instead of C header files. (#21192) * use cstring instead of string.h * use cstdio instead of stdio.h * remove inttypes.h * use cstdlib instead of stdlib.h * use cstdint instead of stdint.h * #include <cstddef> * cstdlib * use cmath * remove stddef.h * use cassert * use csignal * use ctime * use cerror * rebase master 4 years ago			`#include <cstring>`
cpplint: `build/include_what_you_use` (#29556) * include_what_you_use * remove comments * include <memory> --------- Co-authored-by: Adeeb Shihadeh <adeebshihadeh@gmail.com> 2 years ago			`#include <memory>`
			`#include <string>`
			`#include <utility>`
			`#include <vector>`
Cleanup selfdrive/ includes (#20822) * cleanup include path * continue * format includes * fix testraw.cc * remove include path from SConstruct * regroup * rebase master * almost done * apply review * rename FileReader.xx to filereader.xx * rename Unlogger.x->unlogger.x * rename FrameReader.xx -> framereader.xx * apply reviews * ui.h * continue * fix framebuffer.cc build error:mv util.h up * full path to msm_media_info * fix qcom2 camerad Co-authored-by: Comma Device <device@comma.ai> 5 years ago
Merge common/ and selfdrive/common (#24556) * Merge common/ and selfdrive/common * fix that * fix version * fix unit tests 4 years ago			`#include "common/util.h"`
			`#include "common/timing.h"`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago
			`void PrintErrorStringAndExit() {`
			`std::cerr << zdl::DlSystem::getLastErrorString() << std::endl;`
			`std::exit(EXIT_FAILURE);`
			`}`

Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago			`SNPEModel::SNPEModel(const std::string path, float *_output, size_t _output_size, int runtime, bool _use_tf8, cl_context context) {`
			`output = _output;`
			`output_size = _output_size;`
			`use_tf8 = _use_tf8;`

remove comma two support (#24248) * remove comma two support * cleanup release files * little more * more libs * no more gralloc * add snpe back 4 years ago			`#ifdef QCOM2`
Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago			`if (runtime == USE_GPU_RUNTIME) {`
			`snpe_runtime = zdl::DlSystem::Runtime_t::GPU;`
			`} else if (runtime == USE_DSP_RUNTIME) {`
			`snpe_runtime = zdl::DlSystem::Runtime_t::DSP;`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago			`} else {`
Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago			`snpe_runtime = zdl::DlSystem::Runtime_t::CPU;`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago			`}`
Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago			`assert(zdl::SNPE::SNPEFactory::isRuntimeAvailable(snpe_runtime));`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago			`#endif`
util.cc: reduce two read_file functions into one (#20655) * no need to malloc one extra byte * combine two read_file into a faster one * cleanup #include * use resize * apply suggestions from review * space * rebase master 5 years ago			`model_data = util::read_file(path);`
			`assert(model_data.size() > 0);`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago
			`// load model`
util.cc: reduce two read_file functions into one (#20655) * no need to malloc one extra byte * combine two read_file into a faster one * cleanup #include * use resize * apply suggestions from review * space * rebase master 5 years ago			`std::unique_ptr<zdl::DlContainer::IDlContainer> container = zdl::DlContainer::IDlContainer::open((uint8_t*)model_data.data(), model_data.size());`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago			`if (!container) { PrintErrorStringAndExit(); }`
dmonitoringmodeld: add more logging around the init (#28920) 2 years ago			`LOGW("loaded model with size: %lu", model_data.size());`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago
			`// create model runner`
Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago			`zdl::SNPE::SNPEBuilder snpe_builder(container.get());`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago			`while (!snpe) {`
remove comma two support (#24248) * remove comma two support * cleanup release files * little more * more libs * no more gralloc * add snpe back 4 years ago			`#ifdef QCOM2`
Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago			`snpe = snpe_builder.setOutputLayers({})`
			`.setRuntimeProcessor(snpe_runtime)`
			`.setUseUserSuppliedBuffers(true)`
			`.setPerformanceProfile(zdl::DlSystem::PerformanceProfile_t::HIGH_PERFORMANCE)`
			`.build();`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago			`#else`
Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago			`snpe = snpe_builder.setOutputLayers({})`
			`.setUseUserSuppliedBuffers(true)`
			`.setPerformanceProfile(zdl::DlSystem::PerformanceProfile_t::HIGH_PERFORMANCE)`
			`.build();`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago			`#endif`
			`if (!snpe) std::cerr << zdl::DlSystem::getLastErrorString() << std::endl;`
			`}`

			`// create output buffer`
Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago			`zdl::DlSystem::UserBufferEncodingFloat ub_encoding_float;`
			`zdl::DlSystem::IUserBufferFactory &ub_factory = zdl::SNPE::SNPEFactory::getUserBufferFactory();`

			`const auto &output_tensor_names_opt = snpe->getOutputTensorNames();`
			`if (!output_tensor_names_opt) throw std::runtime_error("Error obtaining output tensor names");`
			`const auto &output_tensor_names = *output_tensor_names_opt;`
			`assert(output_tensor_names.size() == 1);`
			`const char *output_tensor_name = output_tensor_names.at(0);`
			`const zdl::DlSystem::TensorShape &buffer_shape = snpe->getInputOutputBufferAttributes(output_tensor_name)->getDims();`
			`if (output_size != 0) {`
			`assert(output_size == buffer_shape[1]);`
			`} else {`
			`output_size = buffer_shape[1];`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago			`}`
Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago			`std::vector<size_t> output_strides = {output_size * sizeof(float), sizeof(float)};`
			`output_buffer = ub_factory.createUserBuffer(output, output_size * sizeof(float), output_strides, &ub_encoding_float);`
			`output_map.add(output_tensor_name, output_buffer.get());`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago			`}`

Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago			`void SNPEModel::addInput(const std::string name, float *buffer, int size) {`
			`const int idx = inputs.size();`
			`const auto &input_tensor_names_opt = snpe->getInputTensorNames();`
			`if (!input_tensor_names_opt) throw std::runtime_error("Error obtaining input tensor names");`
			`const auto &input_tensor_names = *input_tensor_names_opt;`
			`const char *input_tensor_name = input_tensor_names.at(idx);`
			`const bool input_tf8 = use_tf8 && strcmp(input_tensor_name, "input_img") == 0; // TODO: This is a terrible hack, get rid of this name check both here and in onnx_runner.py`
dmonitoringmodeld: add more logging around the init (#28920) 2 years ago			`LOGW("adding index %d: %s", idx, input_tensor_name);`
Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago
			`zdl::DlSystem::UserBufferEncodingFloat ub_encoding_float;`
			`zdl::DlSystem::UserBufferEncodingTf8 ub_encoding_tf8(0, 1./255); // network takes 0-1`
			`zdl::DlSystem::IUserBufferFactory &ub_factory = zdl::SNPE::SNPEFactory::getUserBufferFactory();`
			`zdl::DlSystem::UserBufferEncoding *input_encoding = input_tf8 ? (zdl::DlSystem::UserBufferEncoding*)&ub_encoding_tf8 : (zdl::DlSystem::UserBufferEncoding*)&ub_encoding_float;`

			`const auto &buffer_shape_opt = snpe->getInputDimensions(input_tensor_name);`
			`const zdl::DlSystem::TensorShape &buffer_shape = *buffer_shape_opt;`
			`size_t size_of_input = input_tf8 ? sizeof(uint8_t) : sizeof(float);`
			`std::vector<size_t> strides(buffer_shape.rank());`
			`strides[strides.size() - 1] = size_of_input;`
			`size_t product = 1;`
			`for (size_t i = 0; i < buffer_shape.rank(); i++) product *= buffer_shape[i];`
			`size_t stride = strides[strides.size() - 1];`
			`for (size_t i = buffer_shape.rank() - 1; i > 0; i--) {`
			`stride *= buffer_shape[i];`
			`strides[i-1] = stride;`
			`}`
bigmodel (#23684) * Added wide cam vipc client and bigmodel transform logic * Added wide_frame to ModelState, should still work normally * Refactored image input into addImage method, should still work normally * Updated thneed/compile.cc * Bigmodel, untested: 44f83118-b375-4d4c-ae12-2017124f0cf4/200 * Have to initialize extra buffer in SNPEModel * Default paramater value in the wrong place I think * Move USE_EXTRA to SConscript * New model: 6c34d59a-acc3-4877-84bd-904c10745ba6/250 * move use extra check to runtime, not on C2 * this is always true * more C2 checks * log if frames are out of sync * more logging on no frame * store in pointer * print sof * add sync logic * log based on sof difference as well * keep both models * less assumptions * define above thneed * typo * simplify * no need for second client is main is already wide * more comments update * no optional reference * more logging to debug lags * add to release files * both defines * New model: 6831a77f-2574-4bfb-8077-79b0972a2771/950 * Path offset no longer relevant * Remove duplicate execute * Moved bigmodel back to big_supercombo.dlc * add wide vipc stream * Tici must be tici * Needs state too * add wide cam support to model replay * handle syncing better * ugh, c2 * print that * handle ecam lag * skip first one * so close * update refs Co-authored-by: mitchellgoffpc <mitchellgoffpc@gmail.com> Co-authored-by: Harald Schafer <harald.the.engineer@gmail.com> Co-authored-by: Adeeb Shihadeh <adeebshihadeh@gmail.com> Co-authored-by: Comma Device <device@comma.ai> 4 years ago
Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago			`auto input_buffer = ub_factory.createUserBuffer(buffer, product*size_of_input, strides, input_encoding);`
			`input_map.add(input_tensor_name, input_buffer.get());`
			`inputs.push_back(std::unique_ptr<SNPEModelInput>(new SNPEModelInput(name, buffer, size, std::move(input_buffer))));`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago			`}`

bigmodel (#23684) * Added wide cam vipc client and bigmodel transform logic * Added wide_frame to ModelState, should still work normally * Refactored image input into addImage method, should still work normally * Updated thneed/compile.cc * Bigmodel, untested: 44f83118-b375-4d4c-ae12-2017124f0cf4/200 * Have to initialize extra buffer in SNPEModel * Default paramater value in the wrong place I think * Move USE_EXTRA to SConscript * New model: 6c34d59a-acc3-4877-84bd-904c10745ba6/250 * move use extra check to runtime, not on C2 * this is always true * more C2 checks * log if frames are out of sync * more logging on no frame * store in pointer * print sof * add sync logic * log based on sof difference as well * keep both models * less assumptions * define above thneed * typo * simplify * no need for second client is main is already wide * more comments update * no optional reference * more logging to debug lags * add to release files * both defines * New model: 6831a77f-2574-4bfb-8077-79b0972a2771/950 * Path offset no longer relevant * Remove duplicate execute * Moved bigmodel back to big_supercombo.dlc * add wide vipc stream * Tici must be tici * Needs state too * add wide cam support to model replay * handle syncing better * ugh, c2 * print that * handle ecam lag * skip first one * so close * update refs Co-authored-by: mitchellgoffpc <mitchellgoffpc@gmail.com> Co-authored-by: Harald Schafer <harald.the.engineer@gmail.com> Co-authored-by: Adeeb Shihadeh <adeebshihadeh@gmail.com> Co-authored-by: Comma Device <device@comma.ai> 4 years ago			`void SNPEModel::execute() {`
Refactor model runners (#28598) * Started work on model runner refactor * Fixed some compile errors * everything compiles * Fixed bug in SNPEModel * updateInput -> setInputBuffer * I understand nothing * whoops lol * use std::string instead of char* * Move common logic into RunModel * formatting fix 2 years ago			`if (!snpe->execute(input_map, output_map)) {`
modeld: delete unused SNPE stuff after move to tinygrad (#25635) * delete unused stuff * remove CL interceptor from thneed since we don't use SNPE anymore * remove dead files from release * that's removed * oops, didn't save 3 years ago			`PrintErrorStringAndExit();`
logcatd, loggerd, mapd, modeld, proclogd 6 years ago			`}`
			`}`