bangc-ops/core/tool.cpp

/*************************************************************************
 * Copyright (C) [2022] by Cambricon, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sublicense, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice shall be included
 * in all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
 * IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
 * CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 *************************************************************************/
#include <errno.h>
#include <sys/stat.h>
#include <sys/types.h>
#include <cstring>
#include <string>

#include "core/tool.h"
#include "core/logging.h"

#define INT16_BITWIDTH 16

namespace mluop {
/**
 * Translate a quantization data type into its bit width.
 *
 * @param quantize_dtype  Data type to translate; only MLUOP_DTYPE_INT8 and
 *                        MLUOP_DTYPE_INT16 are accepted.
 * @param bitwidth        Output pointer; receives 8 or 16 on success and is
 *                        left untouched on failure.
 * @return MLUOP_STATUS_SUCCESS on success, MLUOP_STATUS_BAD_PARAM when
 *         bitwidth is NULL, MLUOP_STATUS_NOT_SUPPORTED for any other dtype.
 */
mluOpStatus_t castDtypeToBitwidth(mluOpDataType_t quantize_dtype,
                                  int *bitwidth) {
  if (bitwidth == NULL) {
    LOG(ERROR) << "[castDtypeToBitwidth]:The pointer of bitwidth is NULL.";
    return MLUOP_STATUS_BAD_PARAM;
  }

  // 0 doubles as the "unsupported dtype" marker.
  int width = 0;
  if (quantize_dtype == MLUOP_DTYPE_INT8) {
    width = 8;
  } else if (quantize_dtype == MLUOP_DTYPE_INT16) {
    width = 16;
  }

  if (width == 0) {
    LOG(ERROR) << "[castDtypeToBitwidth]:quantize_dtype is not supported, it "
                  "supports int8, int16.";
    return MLUOP_STATUS_NOT_SUPPORTED;
  }

  *bitwidth = width;
  return MLUOP_STATUS_SUCCESS;
}

/**
 * Compute the quantization position of a float buffer.
 *
 * The result is floor(log2(absmax)) - (bitwidth - 2), where absmax is the
 * largest absolute value in the buffer and bitwidth is 8 or 16 depending on
 * datatype. An all-zero buffer yields position 0.
 *
 * @param input     Buffer of num floats; must not be NULL.
 * @param num       Number of elements in input; must be greater than 0.
 * @param datatype  MLUOP_DTYPE_INT8 or MLUOP_DTYPE_INT16.
 * @param position  Output pointer for the computed position; must not be NULL.
 * @return MLUOP_STATUS_SUCCESS, or MLUOP_STATUS_BAD_PARAM on any invalid
 *         argument (including an unsupported datatype).
 */
mluOpStatus_t getPosition(float *input, size_t num, mluOpDataType_t datatype,
                          int *position) {
  if (input == NULL) {
    LOG(ERROR) << "[getPosition]:The pointer of input is NULL.";
    return MLUOP_STATUS_BAD_PARAM;
  }
  if (position == NULL) {
    LOG(ERROR) << "[getPosition]:The pointer of position is NULL.";
    return MLUOP_STATUS_BAD_PARAM;
  }
  if (num == 0) {
    LOG(ERROR)
        << "[getPosition]:Input num is wrong, it must be greater than 0.";
    return MLUOP_STATUS_BAD_PARAM;
  }

  const bool is_int8 = (datatype == MLUOP_DTYPE_INT8);
  const bool is_int16 = (datatype == MLUOP_DTYPE_INT16);
  if (!is_int8 && !is_int16) {
    LOG(ERROR) << "[getPosition]:Input data type is not supported.";
    return MLUOP_STATUS_BAD_PARAM;
  }
  const int bitwidth = is_int8 ? 8 : 16;

  // Scan for the largest magnitude; element 0 seeds the running maximum.
  float largest = std::fabs(input[0]);
  for (const float *it = input + 1; it != input + num; ++it) {
    const float magnitude = std::fabs(*it);
    if (magnitude > largest) largest = magnitude;
  }

  if (largest == 0) {
    // log2(0) is not usable, so an all-zero buffer maps to position 0.
    *position = 0;
    return MLUOP_STATUS_SUCCESS;
  }

  // Formula: position = floor(log2(absmax)) - (bitwidth - 2)
  const auto exponent = std::floor(std::log2(largest));
  *position = static_cast<int>(exponent - (bitwidth - 2));
  return MLUOP_STATUS_SUCCESS;
}

/**
 * Compute the quantization position and scale of a float buffer.
 *
 * With absmax the largest absolute value in the buffer and bitwidth equal to
 * 8 or 16 depending on datatype:
 *   position = floor(log2(absmax)) - (bitwidth - 2)
 *   scale    = 2^position * (2^(bitwidth - 1) - 1) / absmax
 * An all-zero buffer yields position 0 and scale 1.0.
 *
 * @param input     Buffer of num floats; must not be NULL.
 * @param num       Number of elements in input; must be greater than 0.
 * @param datatype  MLUOP_DTYPE_INT8 or MLUOP_DTYPE_INT16.
 * @param position  Output pointer for the position; must not be NULL.
 * @param scale     Output pointer for the scale; must not be NULL.
 * @return MLUOP_STATUS_SUCCESS, or MLUOP_STATUS_BAD_PARAM on any invalid
 *         argument (including an unsupported datatype).
 */
mluOpStatus_t getPositionAndScale(float *input, size_t num,
                                  mluOpDataType_t datatype, int *position,
                                  float *scale) {
  if (input == NULL) {
    LOG(ERROR) << "[getPositionAndScale]:The pointer of input is NULL.";
    return MLUOP_STATUS_BAD_PARAM;
  }
  if (num == 0) {
    LOG(ERROR)
        << "[getPositionAndScale]:Input num is 0, it must be greater than 0.";
    return MLUOP_STATUS_BAD_PARAM;
  }
  if (position == NULL) {
    LOG(ERROR) << "[getPositionAndScale]:The pointer of position is NULL.";
    return MLUOP_STATUS_BAD_PARAM;
  }
  if (scale == NULL) {
    LOG(ERROR) << "[getPositionAndScale]:The pointer of scale is NULL.";
    return MLUOP_STATUS_BAD_PARAM;
  }

  int bitwidth = 8;
  if (datatype == MLUOP_DTYPE_INT8) {
    bitwidth = 8;
  } else if (datatype == MLUOP_DTYPE_INT16) {
    bitwidth = 16;
  } else {
    LOG(ERROR) << "[getPositionAndScale]:Input data type is not supported.";
    return MLUOP_STATUS_BAD_PARAM;
  }

  // Largest representable magnitude of the signed target type:
  // 127 for int8, 32767 for int16. Computed with an exact integer shift.
  const int scale_var = (1 << (bitwidth - 1)) - 1;

  float max_data = std::fabs(input[0]);
  for (size_t index = 1; index < num; ++index) {
    const float magnitude = std::fabs(input[index]);
    if (magnitude > max_data) max_data = magnitude;
  }

  if (max_data == 0) {
    // log2(0) is not usable, so an all-zero buffer gets neutral parameters.
    *position = 0;
    *scale = 1.0;
    return MLUOP_STATUS_SUCCESS;
  }

  // bitwidth is always 8 or 16 here, so the former "bitwidth == 31" branch
  // (position only, scale fixed to 1.0) could never run and was removed.
  *position =
      static_cast<int>(std::floor(std::log2(max_data)) - (bitwidth - 2));
  *scale = static_cast<float>(std::pow(2, *position) * scale_var / max_data);

  return MLUOP_STATUS_SUCCESS;
}

/**
 * Compute position, scale and offset for asymmetric quantization of a float
 * buffer.
 *
 * The value range [min, max] of the buffer is first widened so that it
 * contains 0. With range = max - min and bitwidth equal to 8 or 16:
 *   position = floor(log2(range)) - (bitwidth - 1)
 *   scale    = 2^position * (2^bitwidth - 1) / range
 *   offset   = round(-2^(bitwidth - 1) - min * (2^bitwidth - 1) / range)
 * A degenerate range (max == min) yields position 0, scale 1 and offset 0.
 *
 * @param input     Buffer of num floats; must not be NULL.
 * @param num       Number of elements in input; must be greater than 0.
 * @param datatype  MLUOP_DTYPE_INT8 or MLUOP_DTYPE_INT16.
 * @param position  Output pointer for the position; must not be NULL.
 * @param scale     Output pointer for the scale; must not be NULL.
 * @param offset    Output pointer for the offset; must not be NULL.
 * @return MLUOP_STATUS_SUCCESS, or MLUOP_STATUS_BAD_PARAM on any invalid
 *         argument (including an unsupported datatype).
 */
mluOpStatus_t getPositionScaleAndOffset(float *input, size_t num,
                                        mluOpDataType_t datatype, int *position,
                                        float *scale, int *offset) {
  if (input == NULL) {
    LOG(ERROR) << "[getPositionScaleAndOffset]:The pointer of input is NULL.";
    return MLUOP_STATUS_BAD_PARAM;
  }
  if (num == 0) {
    LOG(ERROR) << "[getPositionScaleAndOffset]:Input num is 0, it must be "
                  "greater than 0.";
    return MLUOP_STATUS_BAD_PARAM;
  }
  if (position == NULL) {
    LOG(ERROR)
        << "[getPositionScaleAndOffset]:The pointer of position is NULL.";
    return MLUOP_STATUS_BAD_PARAM;
  }
  if (scale == NULL) {
    LOG(ERROR) << "[getPositionScaleAndOffset]:The pointer of scale is NULL.";
    return MLUOP_STATUS_BAD_PARAM;
  }
  if (offset == NULL) {
    LOG(ERROR) << "[getPositionScaleAndOffset]:The pointer of offset is NULL.";
    return MLUOP_STATUS_BAD_PARAM;
  }

  const bool is_int8 = (datatype == MLUOP_DTYPE_INT8);
  const bool is_int16 = (datatype == MLUOP_DTYPE_INT16);
  if (!is_int8 && !is_int16) {
    LOG(ERROR)
        << "[getPositionScaleAndOffset]:input data type is not supported.";
    return MLUOP_STATUS_BAD_PARAM;
  }
  const int bitwidth = is_int8 ? 8 : 16;

  // Track the running extremes. The negated comparisons deliberately keep the
  // "replace unless strictly better" behaviour of the comparison chain.
  float hi = input[0];
  float lo = input[0];
  for (const float *it = input; it != input + num; ++it) {
    const float value = *it;
    if (!(hi > value)) hi = value;
    if (!(lo < value)) lo = value;
  }

  // Widen the range so that it always contains zero.
  if (!(hi > 0)) hi = 0;
  if (!(lo < 0)) lo = 0;

  if (hi == lo) {
    *position = 0;
    *scale = 1;
    *offset = 0;
    return MLUOP_STATUS_SUCCESS;
  }

  *position = static_cast<int>(floorf(log2f(hi - lo)) - (bitwidth - 1));
  *scale = powf(2, *position) * (powf(2, bitwidth) - 1) / (hi - lo);
  *offset = static_cast<int>(roundf(
      -powf(2, bitwidth - 1) - lo * (powf(2, bitwidth) - 1) / (hi - lo)));

  return MLUOP_STATUS_SUCCESS;
}

int16_t castFloat32ToHalf(float src) {
  /**
   * @desc:
   *  Convert a `float32` number to the bit pattern of a half-precision
   *  (float16) number, returned in an `int16_t`.
   *
   *  Conversion rules implemented below:
   *   - NaN maps to a half NaN (exponent 0x1f, mantissa 0x200).
   *   - Infinity and magnitudes with exponent >= 16 saturate to the largest
   *     finite half (0x7bff, i.e. 65504) instead of producing infinity.
   *   - Values in the half normal/denormal range are rounded by adding the
   *     first discarded mantissa bit (round half up on the magnitude).
   *   - Any smaller non-zero magnitude becomes the smallest half denormal.
   *   - The sign bit is always carried over.
   * @param:
   *  src: the `float32` number to convert.
   * @return:
   *  The half-precision bit pattern as `int16_t`.
   * **/
  static_assert(sizeof(float) == sizeof(uint32_t),
                "castFloat32ToHalf expects a 32-bit float");

  // Read the raw bits with memcpy: dereferencing a float through an int
  // pointer violates strict aliasing, and shifting negative signed values is
  // not portable, so all bit work is done on unsigned integers.
  uint32_t bits = 0;
  std::memcpy(&bits, &src, sizeof(bits));

  const uint32_t sign = bits >> 31;
  const uint32_t mantissa = bits & 0x7fffffu;
  int exp = static_cast<int>((bits >> 23) & 0xffu) - 127;  // unbiased

  bool denorm = false;
  uint32_t eff = 0;    // 10-bit half mantissa
  uint32_t guard = 0;  // first discarded bit, used for rounding

  if ((exp == 128) && (mantissa != 0)) {  // NaN
    exp = 0x1f - 15;
    eff = 0x200;
  } else if (exp >= 16) {  // too large (incl. infinity): saturate
    exp = 0xf;
    eff = 0x3ff;
  } else if (exp >= -14) {  // representable as a normal half
    guard = (mantissa >> 12) & 1u;
    eff = (mantissa >> 13) & 0x3ffu;
  } else if (exp >= -24) {  // representable as a denormal half
    const uint32_t significand = mantissa | 0x800000u;  // add implicit 1
    guard = (significand >> (-exp - 2)) & 1u;
    eff = (significand >> (-exp - 1)) & 0x3ffu;
    denorm = true;
    exp = 0;
  } else {  // below the smallest denormal
    denorm = true;
    exp = 0;
    eff = (bits & 0x7fffffffu) ? 1u : 0u;
  }

  // Round; a mantissa overflow intentionally carries into the exponent field.
  eff += guard;

  const uint32_t biased_exp = denorm ? 0u : static_cast<uint32_t>(exp + 15);
  const uint16_t half =
      static_cast<uint16_t>((sign << 15) + (biased_exp << 10) + eff);

  int16_t result = 0;
  std::memcpy(&result, &half, sizeof(result));
  return result;
}

/**
 * Convert a half-precision (float16) bit pattern stored in an `int16_t` to a
 * `float`.
 *
 *  - A half NaN yields a float NaN with the same sign bit.
 *  - A half infinity is clamped to the largest finite half value: +65504 or
 *    -65504 depending on the sign.
 *  - Normal and denormal halves are converted exactly; the sign of zero is
 *    kept.
 *
 * @param src  Half-precision bit pattern.
 * @return The corresponding `float` value.
 */
float castHalfToFloat32(int16_t src) {
  static_assert(sizeof(float) == sizeof(uint32_t),
                "castHalfToFloat32 expects a 32-bit float");

  // Work on the unsigned 16-bit pattern so no signed shifts are involved.
  const uint32_t bits = static_cast<uint16_t>(src);
  const bool negative = ((bits >> 15) & 1u) != 0;
  int exp = static_cast<int>((bits >> 10) & 0x1fu);
  int eff = static_cast<int>(bits & 0x3ffu);

  const float half_max = 65504.;
  const float half_min = -65504.;  // or to be defined as infinity

  if (exp == 0x1f) {
    if (eff != 0) {
      // NaN in, NaN out. The sign bit is preserved: a negative half NaN gives
      // 0xffffffff, a positive one 0x7fffffff. memcpy avoids reading an
      // integer through a float pointer.
      const uint32_t nan_bits = negative ? 0xffffffffu : 0x7fffffffu;
      float nan_value = 0.f;
      std::memcpy(&nan_value, &nan_bits, sizeof(nan_value));
      return nan_value;
    }
    // Infinity is clamped to the bounds of half:
    // 0x7bff = 0 11110 1111111111 = 65504, 0xfbff = -65504.
    return negative ? half_min : half_max;
  }

  if (exp > 0) {
    exp -= 15;            // remove the exponent bias
    eff = eff | 0x400;    // restore the implicit leading 1
  } else {
    exp = -14;            // denormal: fixed exponent, no implicit 1
  }

  // value = eff * 2^(exp - 10); both factors are exact in float.
  const int sft = exp - 10;
  const float sign = negative ? -1.f : 1.f;
  if (sft < 0) {
    return sign * eff / (1 << (-sft));
  }
  return sign * (1 << sft) * eff;
}

/**
 * Make sure a directory exists at pathname, creating it (mode 0777) when
 * nothing can be stat'ed there.
 *
 * @param pathname  Path of the directory.
 * @return 0 when the directory already exists or was created, ENOTDIR when
 *         the path exists but is not a directory, otherwise the errno left by
 *         the failed mkdir call.
 */
int mkdirIfNotExist(const char *pathname) {
  struct stat info = {};
  const bool exists = (stat(pathname, &info) == 0);
  if (exists) {
    return S_ISDIR(info.st_mode) ? 0 : ENOTDIR;
  }
  // Nothing could be stat'ed at the path, so try to create the directory.
  return (mkdir(pathname, 0777) == 0) ? 0 : errno;
}

/**
 * Create a directory together with every missing parent directory.
 *
 * The path is walked from left to right; every prefix ending in '/' is passed
 * to mkdirIfNotExist, followed by the full path when it does not end in '/'.
 *
 * @param pathname  Path to create. The caller must ensure it is not null.
 * @return 0 on success (also for an empty path), otherwise the first non-zero
 *         code returned by mkdirIfNotExist.
 */
int mkdirRecursive(const char *pathname) {
  const std::string full_path(pathname);
  const char separator = '/';

  for (size_t cursor = 0; cursor < full_path.size();) {
    const size_t sep_at = full_path.find(separator, cursor);
    if (sep_at == std::string::npos) {
      // No separator left: what remains is the final path component.
      return mkdirIfNotExist(full_path.c_str());
    }

    // Create the prefix up to and including this separator.
    const std::string prefix = full_path.substr(0, sep_at + 1);
    const int status = mkdirIfNotExist(prefix.c_str());
    if (status != 0) {
      return status;
    }
    cursor = sep_at + 1;
  }
  return 0;
}

/**
 * Read an environment variable as an unsigned 64-bit integer.
 *
 * The value must consist of an optional leading '+' or '-' followed by at
 * least one decimal digit; it is then parsed with strtoull (base 10), so
 * strtoull's handling of a leading '-' and of out-of-range values applies.
 * Anything else (including an empty or sign-only value) is reported with a
 * warning and the default is returned.
 *
 * @param str           Name of the environment variable.
 * @param default_para  Value returned when the variable is unset or invalid.
 * @return The parsed value, or default_para.
 */
uint64_t getUintEnvVar(const std::string &str, uint64_t default_para) {
  const char *env_raw_ptr = std::getenv(str.c_str());
  if (env_raw_ptr == nullptr) {
    return default_para;
  }

  // Skip one optional sign character, then require digits only.
  const char *cursor = env_raw_ptr;
  if (*cursor == '-' || *cursor == '+') {
    ++cursor;
  }
  // A value without any digit is not a number.
  bool is_digital = (*cursor != '\0');
  for (; is_digital && *cursor != '\0'; ++cursor) {
    // std::isdigit has undefined behaviour for negative char values, so the
    // character is converted to unsigned char first.
    is_digital = std::isdigit(static_cast<unsigned char>(*cursor)) != 0;
  }

  if (!is_digital) {
    LOG(WARNING) << str << ": " << env_raw_ptr
                 << " is not digital, uses default value " << default_para
                 << ".";
    return default_para;
  }

  return strtoull(env_raw_ptr, nullptr, 10);
}

/**
 * Read an environment variable as a string.
 *
 * @param str           Name of the environment variable.
 * @param default_para  Value returned when the variable is not set.
 * @return The variable's value (possibly empty), or default_para when the
 *         variable is not set.
 */
std::string getStringEnvVar(const std::string &str, std::string default_para) {
  if (const char *value = std::getenv(str.c_str())) {
    return std::string(value);
  }
  return default_para;
}

/**
 * Read an environment variable as a boolean.
 *
 * The value is compared case-insensitively against "1", "ON", "YES" and
 * "TRUE"; any other value (including an empty one) is false.
 *
 * @param str           Name of the environment variable.
 * @param default_para  Value returned when the variable is not set.
 * @return true for one of the accepted spellings, false for any other value,
 *         default_para when the variable is not set.
 */
bool getBoolEnvVar(const std::string &str, bool default_para) {
  const char *env_raw_ptr = std::getenv(str.c_str());
  if (env_raw_ptr == nullptr) {
    return default_para;
  }
  std::string env_var(env_raw_ptr);
  // toupper has undefined behaviour for negative char values, so each
  // character goes through unsigned char before the call.
  std::transform(env_var.begin(), env_var.end(), env_var.begin(),
                 [](char c) {
                   return static_cast<char>(
                       ::toupper(static_cast<unsigned char>(c)));
                 });
  return (env_var == "1" || env_var == "ON" || env_var == "YES" ||
          env_var == "TRUE");
}
}  // namespace mluop