// RONCC / NVIDIA-AI-Image-Classification

/**
 * Copyright (c) 2018, NVIDIA CORPORATION. All rights reserved.
 * Full license terms provided in LICENSE.md file.
 */

#ifndef TRT_IMAGE_CLASSIFICATION_UTILS_H
#define TRT_IMAGE_CLASSIFICATION_UTILS_H


#include <opencv2/opencv.hpp>
#include <vector>
#include <algorithm>
#include <NvInfer.h>


/**
 * Copies an interleaved (height, width, channel) 8-bit OpenCV image into a
 * planar (channel, height, width) float tensor.
 *
 * Declared inline because this header defines the function; without it,
 * including the header from more than one translation unit fails at link time.
 *
 * @param image      Source image. Its rows, cols and channel count must equal the
 *                   height, width and channels described by `dimensions`. Pixel
 *                   bytes are read as unsigned 8-bit values.
 * @param tensor     Destination buffer with room for channels * height * width floats.
 * @param dimensions Tensor shape, read as d[0] = channels, d[1] = height, d[2] = width.
 *
 * A shape mismatch trips CV_Assert (OpenCV reports it as cv::Exception) instead
 * of reading outside the image buffer.
 */
inline void cvImageToTensor(const cv::Mat & image, float *tensor, nvinfer1::Dims dimensions)
{
  const size_t channels = dimensions.d[0];
  const size_t height = dimensions.d[1];
  const size_t width = dimensions.d[2];

  // Validate that the image really has the shape the tensor expects.
  CV_Assert(static_cast<size_t>(image.rows) == height);
  CV_Assert(static_cast<size_t>(image.cols) == width);
  CV_Assert(static_cast<size_t>(image.channels()) == channels);

  const size_t planeSize = height * width;

  for (size_t row = 0; row < height; ++row)
  {
    // Fetch each row through cv::Mat::ptr so that matrices whose rows are not
    // densely packed (ROI views, padded rows) are still read correctly.
    const unsigned char *src = image.ptr<unsigned char>(static_cast<int>(row));
    for (size_t col = 0; col < width; ++col)
    {
      for (size_t ch = 0; ch < channels; ++ch)
      {
        const size_t offset = ch * planeSize + row * width + col;
        tensor[offset] = static_cast<float>(src[col * channels + ch]);
      }
    }
  }
}

/**
 * Subtracts a fixed per-channel mean from a planar (channel, height, width)
 * float tensor, in place.
 *
 * Declared inline because this header defines the function; without it,
 * including the header from more than one translation unit fails at link time.
 *
 * @param tensor     Buffer of channels * height * width floats, modified in place.
 * @param dimensions Tensor shape, read as d[0] = channels, d[1] = height, d[2] = width.
 *
 * Only three mean values are defined, so at most the first three channel planes
 * are adjusted; any further planes are left untouched rather than indexing past
 * the end of the mean table.
 */
inline void preprocessVgg(float *tensor, nvinfer1::Dims dimensions)
{
  const size_t channels = dimensions.d[0];
  const size_t height = dimensions.d[1];
  const size_t width = dimensions.d[2];
  const size_t planeSize = height * width;

  const float mean[3] = { 123.68, 116.78, 103.94 }; // values from TensorFlow slim models code
  const size_t numMeans = sizeof(mean) / sizeof(mean[0]);
  const size_t adjustedChannels = std::min(channels, numMeans);

  // Walk one channel plane at a time so memory is touched contiguously.
  for (size_t ch = 0; ch < adjustedChannels; ++ch)
  {
    float *plane = tensor + ch * planeSize;
    for (size_t idx = 0; idx < planeSize; ++idx)
      plane[idx] -= mean[ch];
  }
}

/**
 * Rescales every element of a float tensor in place with
 * x -> 2 * (x / 255 - 0.5), which maps 0 to -1 and 255 to 1.
 *
 * Declared inline because this header defines the function; without it,
 * including the header from more than one translation unit fails at link time.
 *
 * @param tensor     Buffer of d[0] * d[1] * d[2] floats, modified in place.
 * @param dimensions Tensor shape; only the first three extents are used.
 */
inline void preprocessInception(float *tensor, nvinfer1::Dims dimensions)
{
  const size_t channels = dimensions.d[0];
  const size_t height = dimensions.d[1];
  const size_t width = dimensions.d[2];
  const size_t numel = channels * height * width;

  // size_t counter: an int counter compared against numel would overflow
  // before reaching the end of a very large tensor.
  for (size_t i = 0; i < numel; ++i)
    tensor[i] = 2.0 * (tensor[i] / 255.0 - 0.5); // values from TensorFlow slim models code
}

/**
 * Returns the index of the largest element of a float tensor.
 *
 * Declared inline because this header defines the function; without it,
 * including the header from more than one translation unit fails at link time.
 *
 * @param tensor     Buffer of d[0] * d[1] * d[2] floats.
 * @param dimensions Tensor shape; only the first three extents are used.
 * @return Index of the first element holding the maximum value, or 0 when the
 *         tensor has no elements.
 */
inline int argmax(float *tensor, nvinfer1::Dims dimensions)
{
  const size_t channels = dimensions.d[0];
  const size_t height = dimensions.d[1];
  const size_t width = dimensions.d[2];
  const size_t numel = channels * height * width;

  if (numel == 0)
    return 0;

  // std::max_element yields the first of several equal maxima, which matches
  // a forward scan that only replaces the best value on a strict '>'.
  const float *largest = std::max_element(tensor, tensor + numel);
  return static_cast<int>(largest - tensor);
}

/**
 * Computes the number of elements described by a shape, i.e. the product of
 * its first nbDims extents.
 *
 * Declared inline because this header defines the function; without it,
 * including the header from more than one translation unit fails at link time.
 *
 * @param dimensions Shape to measure.
 * @return Product of d[0] .. d[nbDims - 1], or 0 when nbDims is not positive or
 *         any extent is negative.
 */
inline size_t numTensorElements(nvinfer1::Dims dimensions)
{
  // A non-positive rank describes no elements (a negative rank would otherwise
  // skip the loop and report 1).
  if (dimensions.nbDims <= 0)
    return 0;

  size_t size = 1;
  for (int i = 0; i < dimensions.nbDims; i++)
  {
    // NOTE(review): a negative extent presumably marks an unknown/dynamic
    // dimension - confirm against the TensorRT version in use. Converting it
    // to size_t would wrap to a huge count, so report zero elements instead.
    if (dimensions.d[i] < 0)
      return 0;
    size *= static_cast<size_t>(dimensions.d[i]);
  }
  return size;
}

/**
 * Returns the element indices of a float tensor ordered by descending value.
 *
 * Declared inline because this header defines the function; without it,
 * including the header from more than one translation unit fails at link time.
 *
 * @param tensor     Buffer holding at least numTensorElements(dimensions) floats.
 * @param dimensions Shape used to determine how many elements to rank.
 * @return Vector of indices such that tensor[result[0]] >= tensor[result[1]] >= ...
 *         The relative order of equal values is unspecified (std::sort is not stable).
 */
inline std::vector<size_t> argsort(float *tensor, nvinfer1::Dims dimensions)
{
  const size_t numel = numTensorElements(dimensions);

  // Start from the identity permutation 0, 1, ..., numel - 1.
  std::vector<size_t> indices(numel);
  for (size_t i = 0; i < numel; ++i)
    indices[i] = i;

  // Order the indices by the values they refer to, largest first.
  std::sort(indices.begin(), indices.end(), [tensor](size_t lhs, size_t rhs) {
    return tensor[lhs] > tensor[rhs];
  });

  return indices;
}

#endif