nvidia-vfx-prototyping/samples/BatchEffectApp/BatchEffectApp.cpp

/*###############################################################################
#
# Copyright (c) 2020 NVIDIA Corporation
#
# Permission is hereby granted, free of charge, to any person obtaining a copy of
# this software and associated documentation files (the "Software"), to deal in
# the Software without restriction, including without limitation the rights to
# use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of
# the Software, and to permit persons to whom the Software is furnished to do so,
# subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS
# FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR
# COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER
# IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
# CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
#
###############################################################################*/

#include <stdarg.h>
#include <stdio.h>
#include <string.h>

#include <string>

#include "BatchUtilities.h"
#include "nvCVOpenCV.h"
#include "nvVideoEffects.h"
#include "opencv2/opencv.hpp"

// When building with MSVC, route the strcasecmp() calls in this file to _stricmp().
#ifdef _MSC_VER
  #define strcasecmp _stricmp
#endif // _MSC_VER

// Error-handling helpers. Every macro jumps to a label named `bail`, so any function that
// uses them must define that label (the functions in this file return `err` from there).
//   BAIL_IF_ERR(err)            - jump to bail when err is nonzero.
//   BAIL_IF_NULL(x, err, code)  - when x is NULL, set err = code and jump to bail.
//   BAIL_IF_FALSE(x, err, code) - when x is false, set err = code and jump to bail.
//   BAIL(err, code)             - unconditionally set err = code and jump to bail.
// The do { ... } while(0) wrapper makes each macro behave as a single statement.
#define BAIL_IF_ERR(err)            do { if (0 != (err)) {                      goto bail; } } while(0)
#define BAIL_IF_NULL(x, err, code)  do { if ((void*)(x) == NULL)  { err = code; goto bail; } } while(0)
#define BAIL_IF_FALSE(x, err, code) do { if (!(x))                { err = code; goto bail; } } while(0)
#define BAIL(err, code)             do {                            err = code; goto bail;   } while(0)


// Command-line options. ParseMyArgs() fills these in; App::init(), BatchProcessImages()
// and main() read them.
bool                      FLAG_verbose        = false;  // --verbose or -v: print extra diagnostics
float                     FLAG_strength       = 0.f,    // --strength: forwarded to the effect as NVVFX_STRENGTH
                          FLAG_scale          = 1.0;    // --scale: output size = source size * scale (used when FLAG_resolution is 0)
int                       FLAG_mode           = 0,      // --mode: forwarded to the effect as NVVFX_MODE
                          FLAG_resolution     = 0;      // desired output height; when nonzero it takes precedence over FLAG_scale
std::string               FLAG_outFile,                 // --out_file: output file name pattern
                          FLAG_modelDir,                // --model_dir: forwarded to the effect as NVVFX_MODEL_DIRECTORY
                          FLAG_effect;                  // --effect: name of the effect to create
std::vector<const char*>  FLAG_inFiles;                 // input image paths (arguments without a leading dash); these point into argv

// Set this when using OTA Updates.
// nvVideoEffectsProxy.cpp uses this path to load the SDK DLL in that case.
// It is left NULL here; nothing in this file assigns it.
char *g_nvVFXSDKPath = NULL;

// Match a command-line argument against a flag name and extract its raw value text.
//   flag - flag name without leading dashes, e.g. "mode".
//   arg  - the argument as typed, e.g. "--mode=1" or "--verbose".
//   val  - on a match, receives a pointer to the text after '=' (inside arg),
//          or NULL when the argument carries no '='. Untouched when there is no match.
// Returns true when arg starts with one or more dashes followed by exactly `flag`.
static bool GetFlagArgVal(const char *flag, const char *arg, const char **val) {
  if (arg[0] != '-')
    return false;

  // Step over the first dash and any further dashes that follow it.
  const char *name = arg + 1;
  while (*name == '-')
    ++name;

  const char *eq = strchr(name, '=');
  if (eq == nullptr) {
    // Bare flag: the whole remainder must equal the flag name.
    if (strcmp(flag, name) == 0) {
      *val = nullptr;
      return true;
    }
    return false;
  }

  // "name=value": the text before '=' must equal the flag name exactly (no prefix matches).
  const size_t nameLen = static_cast<size_t>(eq - name);
  if (strlen(flag) == nameLen && strncmp(flag, name, nameLen) == 0) {
    *val = eq + 1;
    return true;
  }
  return false;
}

// String-valued flag: on a match, stores the text after '=' in *val,
// or an empty string when the flag was given without a value.
// Returns true when arg matches flag; *val is untouched otherwise.
static bool GetFlagArgVal(const char *flag, const char *arg, std::string *val) {
  const char *raw = nullptr;
  const bool matched = GetFlagArgVal(flag, arg, &raw);
  if (matched) {
    if (raw != nullptr)
      *val = raw;
    else
      val->clear();
  }
  return matched;
}

// Boolean flag: a bare "--flag" means true; "--flag=<text>" is true only when <text> is
// "true", "on", "yes" or "1" (case-insensitive) and false for anything else.
// Returns true when arg matches flag; *val is untouched otherwise.
static bool GetFlagArgVal(const char *flag, const char *arg, bool *val) {
  const char *text;
  if (!GetFlagArgVal(flag, arg, &text))
    return false;

  if (text == NULL) {
    *val = true;
    return true;
  }

  static const char *const kTruthy[] = { "true", "on", "yes", "1" };
  bool truthy = false;
  for (const char *word : kTruthy) {
    if (strcasecmp(text, word) == 0) {
      truthy = true;
      break;
    }
  }
  *val = truthy;
  return true;
}

// Float-valued flag: on "--flag=<number>", parses <number> with strtof() into *val.
// Returns true when arg matches flag AND carries a value.
// A bare "--flag" (no "=value") is reported as not matched and leaves *val untouched;
// previously that case passed a NULL pointer to strtof().
static bool GetFlagArgVal(const char *flag, const char *arg, float *val) {
  const char *valStr = nullptr;
  if (!GetFlagArgVal(flag, arg, &valStr))
    return false;
  if (valStr == nullptr)  // flag given without "=value": nothing to parse
    return false;
  *val = strtof(valStr, nullptr);
  return true;
}

// Integer-valued flag: on "--flag=<number>", parses <number> as base-10 with strtol() into *val.
// Returns true when arg matches flag AND carries a value.
// A bare "--flag" (no "=value") is reported as not matched and leaves *val untouched;
// previously that case passed a NULL pointer to strtol().
static bool GetFlagArgVal(const char *flag, const char *arg, long *val) {
  const char *valStr = nullptr;
  if (!GetFlagArgVal(flag, arg, &valStr))
    return false;
  if (valStr == nullptr)  // flag given without "=value": nothing to parse
    return false;
  *val = strtol(valStr, nullptr, 10);
  return true;
}

// int-valued flag: defers to the long overload and narrows the result to int.
// Returns true when that overload reports a match; *val is untouched otherwise.
static bool GetFlagArgVal(const char *flag, const char *arg, int *val) {
  long wide;
  if (!GetFlagArgVal(flag, arg, &wide))
    return false;
  *val = static_cast<int>(wide);
  return true;
}

// Print the command-line help, followed by the SDK's list of available effects.
// If the effect list cannot be queried, an error line is printed in its place.
static void Usage() {
  printf(
    "BatchEffectApp [flags ...] inFile1 [ inFileN ...]\n"
    "  where flags is:\n"
    "  --out_file=<path>     output image files to be written, default \"BatchOut_%%02u.png\"\n"
    "  --effect=<effect>     the effect to apply\n"
    "  --strength=<value>    strength of the upscaling effect, [0.0, 1.0]\n"
    "  --scale=<scale>       scale factor to be applied: 1.5, 2, 3, maybe 1.3333333\n"
    "  --resolution=<height> the desired height (either --scale or --resolution may be used)\n"
    "  --mode=<mode>         mode 0 or 1\n"
    "  --model_dir=<path>    the path to the directory that contains the models\n"
    "  --verbose             verbose output\n"
    "  and inFile1 ... are identically sized image files, e.g. png, jpg\n"
  );

  const char* cStr = nullptr;
  NvCV_Status err = NvVFX_GetString(nullptr, NVVFX_INFO, &cStr);
  if (NVCV_SUCCESS != err) {
    // cStr is not valid on failure, so do not fall through and print it.
    printf("Cannot get effects: %s\n", NvCV_GetErrorStringFromCode(err));
    return;
  }
  if (cStr != nullptr)
    printf("where effects are:\n%s", cStr);
}

static int ParseMyArgs(int argc, char **argv) {
  int errs = 0;
  for (--argc, ++argv; argc--; ++argv) {
    bool help;
    const char *arg = *argv;
    if (arg[0] == '-') {
      if (arg[1] == '-') {                                      // double-dash
        if (GetFlagArgVal("verbose",    arg, &FLAG_verbose)   ||
            GetFlagArgVal("effect",     arg, &FLAG_effect)    ||
            GetFlagArgVal("strength",   arg, &FLAG_strength)  ||
            GetFlagArgVal("scale",      arg, &FLAG_scale)     ||
            GetFlagArgVal("mode",       arg, &FLAG_mode)      ||
            GetFlagArgVal("model_dir",  arg, &FLAG_modelDir)  ||
            GetFlagArgVal("out_file",   arg, &FLAG_outFile)
        ) {
          continue;
        } else if (GetFlagArgVal("help", arg, &help)) {         // --help
          Usage();
          errs = 1;
        }
      }
      else {                                                    // single dash
        for (++arg; *arg; ++arg) {
          if (*arg == 'v') {
            FLAG_verbose = true;
          } else {
            printf("Unknown flag ignored: \"-%c\"\n", *arg);
          }
        }
        continue;
      }
    }
    else {                                                      // no dash
      FLAG_inFiles.push_back(arg);
    }
  }
  return errs;
}

// Returns true when str ends with suf, compared case-insensitively.
// An empty suf matches every string.
static bool HasSuffix(const char *str, const char *suf) {
  const size_t strLen = strlen(str);
  const size_t sufLen = strlen(suf);
  if (sufLen > strLen)
    return false;
  const char *tail = str + (strLen - sufLen);  // last sufLen characters of str
  return strcasecmp(suf, tail) == 0;
}

// Returns true when str ends (case-insensitively) with any of the suffixes that follow it.
// The variadic list consists of const char* suffixes and MUST be terminated by nullptr.
static bool HasOneOfTheseSuffixes(const char *str, ...) {
  va_list args;
  va_start(args, str);
  bool found = false;
  for (const char *candidate = va_arg(args, const char*);
       candidate != nullptr;
       candidate = va_arg(args, const char*)) {
    if (HasSuffix(str, candidate)) {
      found = true;
      break;
    }
  }
  va_end(args);
  return found;
}

// Returns true when the file name has a ".jpg" or ".jpeg" extension (case-insensitive).
static bool IsLossyImageFile(const char *str) {
  const bool isJpeg = HasOneOfTheseSuffixes(str, ".jpg", ".jpeg", nullptr);
  return isJpeg;
}

// Bundles one video effect with the batched GPU buffers and the CUDA stream it runs on.
// Members are public because BatchProcessImages() drives the effect directly.
class App {
public:
  NvVFX_Handle  _eff;             // effect handle; created in init(), destroyed in ~App()
  NvCVImage     _src, _dst, _stg; // batched source, batched destination, and the scratch image handed to the transfer helpers
  CUstream      _stream;          // CUDA stream; created in init(), destroyed in ~App()
  unsigned      _batchSize;       // batch size requested in init()

  App() : _eff(nullptr), _stream(0), _batchSize(0) {}
  ~App() {
    if (_eff)    NvVFX_DestroyEffect(_eff);
    if (_stream) NvVFX_CudaStreamDestroy(_stream);
  }

  // The destructor releases _eff and _stream, so a copy would release them a second time.
  App(const App&) = delete;
  App& operator=(const App&) = delete;

  // Create the named effect, allocate its batched source/destination buffers, set its
  // parameters from the FLAG_* globals, and load the model.
  //   effectName - one of the NVVFX_FX_* effect names this build supports.
  //   batchSize  - number of images that will be processed together.
  //   src        - an image whose width and height determine the buffer sizes.
  // Returns NVCV_SUCCESS on success, NVCV_ERR_UNIMPLEMENTED for an effect name that is
  // not handled here, or the error reported by the failing SDK call.
  NvCV_Status init(const char* effectName, unsigned batchSize, const NvCVImage *src) {
    NvCV_Status err = NVCV_ERR_UNIMPLEMENTED;
    unsigned    dw, dh;

    // Output size: an explicit height wins (aspect ratio preserved), otherwise apply the scale factor.
    if (FLAG_resolution) {
      dw = FLAG_resolution * src->width / src->height;  // No rounding
      dh = FLAG_resolution;
    }
    else {
      dw = lroundf(src->width  * FLAG_scale);
      dh = lroundf(src->height * FLAG_scale);
    }

    _batchSize = batchSize;
    BAIL_IF_ERR(err = NvVFX_CreateEffect(effectName, &_eff));

    // Each effect gets its own buffer format and its own set of parameters.
    if (!strcmp(effectName, NVVFX_FX_TRANSFER)) {
      BAIL_IF_ERR(err = AllocateBatchBuffer(&_src, _batchSize, src->width, src->height, NVCV_RGB, NVCV_U8, NVCV_CHUNKY, NVCV_CUDA, 0));
      BAIL_IF_ERR(err = AllocateBatchBuffer(&_dst, _batchSize, src->width, src->height, NVCV_RGB, NVCV_U8, NVCV_CHUNKY, NVCV_CUDA, 0));
    }
#ifdef NVVFX_FX_SR_UPSCALE
    else if (!strcmp(effectName, NVVFX_FX_SR_UPSCALE)) {
      BAIL_IF_ERR(err = AllocateBatchBuffer(&_src, _batchSize, src->width, src->height, NVCV_RGBA, NVCV_U8, NVCV_CHUNKY, NVCV_CUDA, 32)); // n*32, n>=0
      BAIL_IF_ERR(err = AllocateBatchBuffer(&_dst, _batchSize, dw,         dh,          NVCV_RGBA, NVCV_U8, NVCV_CHUNKY, NVCV_CUDA, 32));
      BAIL_IF_ERR(err = NvVFX_SetF32(_eff, NVVFX_STRENGTH, FLAG_strength));
    }
#endif // NVVFX_FX_SR_UPSCALE
#ifdef NVVFX_FX_ARTIFACT_REDUCTION
    else if (!strcmp(effectName, NVVFX_FX_ARTIFACT_REDUCTION)) {
      BAIL_IF_ERR(err = AllocateBatchBuffer(&_src, _batchSize, src->width, src->height, NVCV_BGR, NVCV_F32, NVCV_PLANAR, NVCV_CUDA, 1));
      BAIL_IF_ERR(err = AllocateBatchBuffer(&_dst, _batchSize, src->width, src->height, NVCV_BGR, NVCV_F32, NVCV_PLANAR, NVCV_CUDA, 1));
      BAIL_IF_ERR(err = NvVFX_SetString(_eff, NVVFX_MODEL_DIRECTORY, FLAG_modelDir.c_str()));
      BAIL_IF_ERR(err = NvVFX_SetU32(_eff, NVVFX_MODE, FLAG_mode));
    }
#endif // NVVFX_FX_ARTIFACT_REDUCTION
#ifdef NVVFX_FX_SUPER_RES
    else if (!strcmp(effectName, NVVFX_FX_SUPER_RES)) {
      BAIL_IF_ERR(err = AllocateBatchBuffer(&_src, _batchSize, src->width, src->height, NVCV_BGR, NVCV_F32, NVCV_PLANAR, NVCV_CUDA, 1));
      BAIL_IF_ERR(err = AllocateBatchBuffer(&_dst, _batchSize, dw,         dh,          NVCV_BGR, NVCV_F32, NVCV_PLANAR, NVCV_CUDA, 1));
      BAIL_IF_ERR(err = NvVFX_SetString(_eff, NVVFX_MODEL_DIRECTORY, FLAG_modelDir.c_str()));
      BAIL_IF_ERR(err = NvVFX_SetU32(_eff, NVVFX_MODE, FLAG_mode));
      BAIL_IF_ERR(err = NvVFX_SetF32(_eff, NVVFX_STRENGTH, FLAG_strength));
    }
#endif // NVVFX_FX_SUPER_RES
    else {
      BAIL(err, NVCV_ERR_UNIMPLEMENTED);
    }

    { // Set common parameters.
      NvCVImage nth;
      BAIL_IF_ERR(err = NvVFX_SetImage(_eff, NVVFX_INPUT_IMAGE,  NthImage(0, src->height,              &_src, &nth)));  // Set the first of the batched images in ...
      BAIL_IF_ERR(err = NvVFX_SetImage(_eff, NVVFX_OUTPUT_IMAGE, NthImage(0, _dst.height / _batchSize, &_dst, &nth)));  // ... and out
      BAIL_IF_ERR(err = NvVFX_CudaStreamCreate(&_stream));
      BAIL_IF_ERR(err = NvVFX_SetCudaStream(_eff, NVVFX_CUDA_STREAM, _stream));

      // The batch size parameter is interpreted at two times:
      // (1) during Load(), an appropriate batch-size model is chosen and loaded;
      // (2) during Run(), the specified number of images in the batch are processed.
      // The optimum throughput results from submitting a batch which is an integral multiple of the batched model
      // chosen in Load().
      //
      // To request a particular batch-sized model, set the batch size before calling Load(),
      // then get the batch size afterward to find out what batch-size model was chosen. If you do not specify the
      // desired batchSize before calling Load(), it will choose the batchSize=1 model, since that is the default
      // value for batchSize.
      //
      // After calling Load(), you can subsequently change the batch size to any number, even larger or smaller
      // than the batch size of the chosen model. If a larger batch size is chosen, smaller batches are submitted
      // until the entire larger batch has been processed. In any event, the batch size should be set at least twice:
      // once before Load() and once before the initial Run(). In many server applications, it is expected that
      // the batch size is changing constantly as some videos complete and others are added, so setting the batchSize
      // before every Run() call would be typical.
      unsigned gotBatch;
      BAIL_IF_ERR(err = NvVFX_SetU32(_eff, NVVFX_MODEL_BATCH, _batchSize)); // Try to choose a model tuned to this batch size
      err = NvVFX_Load(_eff);                                               // This will load a new batched model -- a weighty process
      if (!(NVCV_SUCCESS == err || NVCV_ERR_MODELSUBSTITUTION == err)) goto bail; // A substituted model is acceptable
      BAIL_IF_ERR(err = NvVFX_GetU32(_eff, NVVFX_MODEL_BATCH, &gotBatch));  // This tells us the batch size of the chosen model
      if (FLAG_verbose && gotBatch != _batchSize) {
        printf("Effect %s has no batch=%u model; processing in multiple batches of size %u%s instead\n",
            effectName, _batchSize, gotBatch, (gotBatch > 1 ? " or less" : ""));
      }
      // Set the run-time batch size unconditionally: it must not depend on whether the
      // diagnostic above was printed.
      BAIL_IF_ERR(err = NvVFX_SetU32(_eff, NVVFX_BATCH_SIZE, _batchSize));  // This is lightweight, and usually done each Run
    }

  bail:
    return err;
  }
};


// Run one effect over a set of identically sized images as a single batch.
//   effectName     - name of the effect, passed to App::init().
//   srcImages      - paths of the input images; the first one fixes the size all others must match.
//   outfilePattern - printf-style pattern for output file names; it receives the image index.
// Returns NVCV_SUCCESS, or NVCV_ERR_MISSINGINPUT (no inputs), NVCV_ERR_READ (unreadable input),
// NVCV_ERR_MISMATCH (size differs from the first image), NVCV_ERR_WRITE (output not written),
// or the error reported by the failing SDK/helper call.
NvCV_Status BatchProcessImages(const char* effectName, const std::vector<const char*>& srcImages, const char *outfilePattern) {
  NvCV_Status status    = NVCV_SUCCESS;
  unsigned    numImages = (unsigned)srcImages.size();
  App         app;
  cv::Mat     cvImg;
  NvCVImage   nvImg;
  unsigned    refWidth = 0, refHeight = 0, outHeight, k;

  BAIL_IF_FALSE(!srcImages.empty(), status, NVCV_ERR_MISSINGINPUT);

  // Read every input and upload it into its slot of the batched source buffer.
  // The first image also determines the resolution used to initialize the effect and buffers.
  // Note, in all transfers, the scale factor only applies to floating-point pixels.
  for (k = 0; k < numImages; ++k) {
    const char *path = srcImages[k];
    cvImg = cv::imread(path);
    if (!cvImg.data) {
      printf("Cannot read image file \"%s\"\n", path);
      BAIL(status, NVCV_ERR_READ);
    }
    NVWrapperForCVMat(&cvImg, &nvImg);

    if (k == 0) {
      refWidth  = nvImg.width;
      refHeight = nvImg.height;
      BAIL_IF_ERR(status = app.init(effectName, numImages, &nvImg));
    }
    else if (nvImg.width != refWidth || nvImg.height != refHeight) {
      printf("Input image file \"%s\" %ux%u does not match %ux%u\n", path, nvImg.width, nvImg.height, refWidth, refHeight);
      BAIL(status, NVCV_ERR_MISMATCH);
    }

    BAIL_IF_ERR(status = TransferToNthImage(k, &nvImg, &app._src, 1.f/255.f, app._stream, &app._stg));
    cvImg.release();
  }

  // Process the whole batch. The batch size can change on every Run, so it is set again here.
  BAIL_IF_ERR(status = NvVFX_SetU32(app._eff, NVVFX_BATCH_SIZE, numImages));
  BAIL_IF_ERR(status = NvVFX_Run(app._eff, 0));

  // Download each result into one reusable CPU image and write it out.
  outHeight = app._dst.height / numImages;  // the destination buffer stacks the batch vertically
  BAIL_IF_ERR(status = NvCVImage_Alloc(&nvImg, app._dst.width, outHeight, ((app._dst.numComponents == 1) ? NVCV_Y : NVCV_BGR), NVCV_U8, NVCV_CHUNKY, NVCV_CPU, 0));
  CVWrapperForNvCVImage(&nvImg, &cvImg);
  if (IsLossyImageFile(outfilePattern)) {
    fprintf(stderr, "WARNING: JPEG output file format will reduce image quality\n");
  }
  for (k = 0; k < numImages; ++k) {
    char outPath[1024];
    snprintf(outPath, sizeof(outPath), outfilePattern, k);
    BAIL_IF_ERR(status = TransferFromNthImage(k, &app._dst, &nvImg, 255.f, app._stream, &app._stg));
    if (!cv::imwrite(outPath, cvImg)) {
      printf("Cannot write image file \"%s\"\n", outPath);
      BAIL(status, NVCV_ERR_WRITE);
    }
  }
  // NvCVImage_Dealloc() is called in the destructors

bail:
  return status;
}


// Entry point: parse the command line, settle the output file pattern, and run the batch.
// Returns 0 on success, the nonzero result of ParseMyArgs(), or the NvCV_Status error code
// of the failed batch.
int main(int argc, char** argv) {
  int         nErrs;
  NvCV_Status vfxErr;

  nErrs = ParseMyArgs(argc, argv);
  if (nErrs)
    return nErrs;

  if (FLAG_outFile.empty()) {
    FLAG_outFile = "BatchOut_%02u.png";
  }
  else if (std::string::npos == FLAG_outFile.find('%')) {
    // No index placeholder given: insert one just before the extension.
    // The extension is located by searching rather than assuming ".xxx", so short names
    // cannot underflow the insert position and extensions such as ".jpeg" are kept intact.
    const std::string::size_type sep = FLAG_outFile.find_last_of("/\\");
    const std::string::size_type dot = FLAG_outFile.rfind('.');
    const bool hasExt = (dot != std::string::npos) && (sep == std::string::npos || dot > sep);
    FLAG_outFile.insert(hasExt ? dot : FLAG_outFile.size(), "_%02u");
  }

  vfxErr = BatchProcessImages(FLAG_effect.c_str(), FLAG_inFiles, FLAG_outFile.c_str());
  if (NVCV_SUCCESS != vfxErr) {
    printf("Error: %s\n", NvCV_GetErrorStringFromCode(vfxErr));
    nErrs = (int)vfxErr;
  }

  return nErrs;
}