// xref: /aosp_15_r20/external/pytorch/android/pytorch_android_torchvision/src/main/cpp/pytorch_vision_jni.cpp (revision da0073e96a02ea20f0ac840b70461e3646d07c45)
1 #include <cassert>
2 #include <cmath>
3 #include <vector>
4 
5 #include "jni.h"
6 
7 namespace pytorch_vision_jni {
8 
imageYUV420CenterCropToFloatBuffer(JNIEnv * jniEnv,jclass,jobject yBuffer,jint yRowStride,jint yPixelStride,jobject uBuffer,jobject vBuffer,jint uRowStride,jint uvPixelStride,jint imageWidth,jint imageHeight,jint rotateCWDegrees,jint tensorWidth,jint tensorHeight,jfloatArray jnormMeanRGB,jfloatArray jnormStdRGB,jobject outBuffer,jint outOffset,jint memoryFormatCode)9 static void imageYUV420CenterCropToFloatBuffer(
10     JNIEnv* jniEnv,
11     jclass,
12     jobject yBuffer,
13     jint yRowStride,
14     jint yPixelStride,
15     jobject uBuffer,
16     jobject vBuffer,
17     jint uRowStride,
18     jint uvPixelStride,
19     jint imageWidth,
20     jint imageHeight,
21     jint rotateCWDegrees,
22     jint tensorWidth,
23     jint tensorHeight,
24     jfloatArray jnormMeanRGB,
25     jfloatArray jnormStdRGB,
26     jobject outBuffer,
27     jint outOffset,
28     jint memoryFormatCode) {
29   constexpr static int32_t kMemoryFormatContiguous = 1;
30   constexpr static int32_t kMemoryFormatChannelsLast = 2;
31 
32   float* outData = (float*)jniEnv->GetDirectBufferAddress(outBuffer);
33 
34   jfloat normMeanRGB[3];
35   jfloat normStdRGB[3];
36   jniEnv->GetFloatArrayRegion(jnormMeanRGB, 0, 3, normMeanRGB);
37   jniEnv->GetFloatArrayRegion(jnormStdRGB, 0, 3, normStdRGB);
38   int widthAfterRtn = imageWidth;
39   int heightAfterRtn = imageHeight;
40   bool oddRotation = rotateCWDegrees == 90 || rotateCWDegrees == 270;
41   if (oddRotation) {
42     widthAfterRtn = imageHeight;
43     heightAfterRtn = imageWidth;
44   }
45 
46   int cropWidthAfterRtn = widthAfterRtn;
47   int cropHeightAfterRtn = heightAfterRtn;
48 
49   if (tensorWidth * heightAfterRtn <= tensorHeight * widthAfterRtn) {
50     cropWidthAfterRtn = tensorWidth * heightAfterRtn / tensorHeight;
51   } else {
52     cropHeightAfterRtn = tensorHeight * widthAfterRtn / tensorWidth;
53   }
54 
55   int cropWidthBeforeRtn = cropWidthAfterRtn;
56   int cropHeightBeforeRtn = cropHeightAfterRtn;
57   if (oddRotation) {
58     cropWidthBeforeRtn = cropHeightAfterRtn;
59     cropHeightBeforeRtn = cropWidthAfterRtn;
60   }
61 
62   const int offsetX = (imageWidth - cropWidthBeforeRtn) / 2.f;
63   const int offsetY = (imageHeight - cropHeightBeforeRtn) / 2.f;
64 
65   const uint8_t* yData = (uint8_t*)jniEnv->GetDirectBufferAddress(yBuffer);
66   const uint8_t* uData = (uint8_t*)jniEnv->GetDirectBufferAddress(uBuffer);
67   const uint8_t* vData = (uint8_t*)jniEnv->GetDirectBufferAddress(vBuffer);
68 
69   float scale = cropWidthAfterRtn / tensorWidth;
70   int uvRowStride = uRowStride;
71   int cropXMult = 1;
72   int cropYMult = 1;
73   int cropXAdd = offsetX;
74   int cropYAdd = offsetY;
75   if (rotateCWDegrees == 90) {
76     cropYMult = -1;
77     cropYAdd = offsetY + (cropHeightBeforeRtn - 1);
78   } else if (rotateCWDegrees == 180) {
79     cropXMult = -1;
80     cropXAdd = offsetX + (cropWidthBeforeRtn - 1);
81     cropYMult = -1;
82     cropYAdd = offsetY + (cropHeightBeforeRtn - 1);
83   } else if (rotateCWDegrees == 270) {
84     cropXMult = -1;
85     cropXAdd = offsetX + (cropWidthBeforeRtn - 1);
86   }
87 
88   float normMeanRm255 = 255 * normMeanRGB[0];
89   float normMeanGm255 = 255 * normMeanRGB[1];
90   float normMeanBm255 = 255 * normMeanRGB[2];
91   float normStdRm255 = 255 * normStdRGB[0];
92   float normStdGm255 = 255 * normStdRGB[1];
93   float normStdBm255 = 255 * normStdRGB[2];
94 
95   int xBeforeRtn, yBeforeRtn;
96   int yi, yIdx, uvIdx, ui, vi, a0, ri, gi, bi;
97   int channelSize = tensorWidth * tensorHeight;
98   // A bit of code duplication to avoid branching in the cycles
99   if (memoryFormatCode == kMemoryFormatContiguous) {
100     int wr = outOffset;
101     int wg = wr + channelSize;
102     int wb = wg + channelSize;
103     for (int y = 0; y < tensorHeight; y++) {
104       for (int x = 0; x < tensorWidth; x++) {
105         xBeforeRtn = cropXAdd + cropXMult * (int)(x * scale);
106         yBeforeRtn = cropYAdd + cropYMult * (int)(y * scale);
107         yIdx = yBeforeRtn * yRowStride + xBeforeRtn * yPixelStride;
108         uvIdx =
109             (yBeforeRtn >> 1) * uvRowStride + (xBeforeRtn >> 1) * uvPixelStride;
110         ui = uData[uvIdx];
111         vi = vData[uvIdx];
112         yi = yData[yIdx];
113         yi = (yi - 16) < 0 ? 0 : (yi - 16);
114         ui -= 128;
115         vi -= 128;
116         a0 = 1192 * yi;
117         ri = (a0 + 1634 * vi) >> 10;
118         gi = (a0 - 833 * vi - 400 * ui) >> 10;
119         bi = (a0 + 2066 * ui) >> 10;
120         ri = ri > 255 ? 255 : ri < 0 ? 0 : ri;
121         gi = gi > 255 ? 255 : gi < 0 ? 0 : gi;
122         bi = bi > 255 ? 255 : bi < 0 ? 0 : bi;
123         outData[wr++] = (ri - normMeanRm255) / normStdRm255;
124         outData[wg++] = (gi - normMeanGm255) / normStdGm255;
125         outData[wb++] = (bi - normMeanBm255) / normStdBm255;
126       }
127     }
128   } else if (memoryFormatCode == kMemoryFormatChannelsLast) {
129     int wc = outOffset;
130     for (int y = 0; y < tensorHeight; y++) {
131       for (int x = 0; x < tensorWidth; x++) {
132         xBeforeRtn = cropXAdd + cropXMult * (int)(x * scale);
133         yBeforeRtn = cropYAdd + cropYMult * (int)(y * scale);
134         yIdx = yBeforeRtn * yRowStride + xBeforeRtn * yPixelStride;
135         uvIdx =
136             (yBeforeRtn >> 1) * uvRowStride + (xBeforeRtn >> 1) * uvPixelStride;
137         ui = uData[uvIdx];
138         vi = vData[uvIdx];
139         yi = yData[yIdx];
140         yi = (yi - 16) < 0 ? 0 : (yi - 16);
141         ui -= 128;
142         vi -= 128;
143         a0 = 1192 * yi;
144         ri = (a0 + 1634 * vi) >> 10;
145         gi = (a0 - 833 * vi - 400 * ui) >> 10;
146         bi = (a0 + 2066 * ui) >> 10;
147         ri = ri > 255 ? 255 : ri < 0 ? 0 : ri;
148         gi = gi > 255 ? 255 : gi < 0 ? 0 : gi;
149         bi = bi > 255 ? 255 : bi < 0 ? 0 : bi;
150         outData[wc++] = (ri - normMeanRm255) / normStdRm255;
151         outData[wc++] = (gi - normMeanGm255) / normStdGm255;
152         outData[wc++] = (bi - normMeanBm255) / normStdBm255;
153       }
154     }
155   } else {
156     jclass Exception = jniEnv->FindClass("java/lang/IllegalArgumentException");
157     jniEnv->ThrowNew(Exception, "Illegal memory format code");
158   }
159 }
160 } // namespace pytorch_vision_jni
161 
JNI_OnLoad(JavaVM * vm,void *)162 JNIEXPORT jint JNI_OnLoad(JavaVM* vm, void*) {
163   JNIEnv* env;
164   if (vm->GetEnv(reinterpret_cast<void**>(&env), JNI_VERSION_1_6) != JNI_OK) {
165     return JNI_ERR;
166   }
167 
168   jclass c =
169       env->FindClass("org/pytorch/torchvision/TensorImageUtils$NativePeer");
170   if (c == nullptr) {
171     return JNI_ERR;
172   }
173 
174   static const JNINativeMethod methods[] = {
175       {"imageYUV420CenterCropToFloatBuffer",
176        "(Ljava/nio/ByteBuffer;IILjava/nio/ByteBuffer;Ljava/nio/ByteBuffer;IIIIIII[F[FLjava/nio/Buffer;II)V",
177        (void*)pytorch_vision_jni::imageYUV420CenterCropToFloatBuffer},
178   };
179   int rc = env->RegisterNatives(
180       c, methods, sizeof(methods) / sizeof(JNINativeMethod));
181 
182   if (rc != JNI_OK) {
183     return rc;
184   }
185 
186   return JNI_VERSION_1_6;
187 }
188